llvm_backend_expr.cpp 172 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427
74278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477
74778477947804781478247834784478547864787478847894790479147924793479447954796479747984799480048014802480348044805480648074808480948104811481248134814481548164817481848194820482148224823482448254826482748284829483048314832483348344835483648374838483948404841484248434844484548464847484848494850485148524853485448554856485748584859486048614862486348644865486648674868486948704871487248734874487548764877487848794880488148824883488448854886488748884889489048914892489348944895489648974898489949004901490249034904490549064907490849094910491149124913491449154916491749184919492049214922492349244925492649274928492949304931493249334934493549364937493849394940494149424943494449454946494749484949495049514952495349544955495649574958495949604961496249634964496549664967496849694970497149724973497449754976497749784979498049814982498349844985498649874988498949904991499249934994499549964997499849995000500150025003500450055006500750085009501050115012501350145015501650175018501950205021502250235024502550265027502850295030503150325033503450355036503750385039504050415042504350445045504650475048504950505051505250535054505550565057505850595060506150625063506450655066506750685069507050715072507350745075507650775078507950805081508250835084508550865087508850895090509150925093509450955096509750985099510051015102510351045105510651075108510951105111511251135114511551165117511851195120512151225123512451255126512751285129513051315132513351345135513651375138513951405141514251435144514551465147514851495150515151525153515451555156515751585159516051615162516351645165516651675168516951705171517251735174517551765177517851795180518151825183518451855186518751885189519051915192519351945195519651975198519952005201520252035204520552065207520852095210521152125213521452155216521752185219522052215222522352245225522652275228522952305231523252335234523552365237523852395240524152425243524452455246524752485249525052515252525352545255525652575258525952605261526252635264526552665267526852695270527152725273527452755276527
75278527952805281528252835284528552865287528852895290529152925293529452955296529752985299530053015302530353045305530653075308530953105311531253135314531553165317531853195320532153225323532453255326532753285329533053315332533353345335533653375338533953405341534253435344534553465347534853495350535153525353535453555356535753585359536053615362536353645365536653675368536953705371537253735374537553765377537853795380538153825383538453855386538753885389539053915392539353945395539653975398539954005401540254035404540554065407540854095410541154125413541454155416541754185419542054215422542354245425542654275428542954305431543254335434543554365437543854395440544154425443544454455446544754485449545054515452545354545455545654575458545954605461546254635464546554665467546854695470547154725473547454755476547754785479548054815482548354845485548654875488548954905491549254935494549554965497
  // Forward declaration: lb_emit_unary_arith (later in this file) calls this to
  // negate a matrix by emitting a component-wise `zero - x`.
  1. gb_internal lbValue lb_emit_arith_matrix(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type, bool component_wise);
  2. gb_internal lbValue lb_emit_logical_binary_expr(lbProcedure *p, TokenKind op, Ast *left, Ast *right, Type *final_type) {
  3. lbModule *m = p->module;
  4. lbBlock *rhs = lb_create_block(p, "logical.cmp.rhs");
  5. lbBlock *done = lb_create_block(p, "logical.cmp.done");
  6. lbValue short_circuit = {};
  7. if (op == Token_CmpAnd) {
  8. lb_build_cond(p, left, rhs, done);
  9. short_circuit = lb_const_bool(m, t_llvm_bool, false);
  10. } else if (op == Token_CmpOr) {
  11. lb_build_cond(p, left, done, rhs);
  12. short_circuit = lb_const_bool(m, t_llvm_bool, true);
  13. }
  14. if (rhs->preds.count == 0) {
  15. lb_start_block(p, done);
  16. return short_circuit;
  17. }
  18. if (done->preds.count == 0) {
  19. lb_start_block(p, rhs);
  20. if (lb_is_expr_untyped_const(right)) {
  21. return lb_expr_untyped_const_to_typed(m, right, default_type(final_type));
  22. }
  23. return lb_build_expr(p, right);
  24. }
  25. Array<LLVMValueRef> incoming_values = {};
  26. Array<LLVMBasicBlockRef> incoming_blocks = {};
  27. array_init(&incoming_values, heap_allocator(), done->preds.count+1);
  28. array_init(&incoming_blocks, heap_allocator(), done->preds.count+1);
  29. for_array(i, done->preds) {
  30. incoming_values[i] = short_circuit.value;
  31. incoming_blocks[i] = done->preds[i]->block;
  32. }
  33. lb_start_block(p, rhs);
  34. lbValue edge = {};
  35. if (lb_is_expr_untyped_const(right)) {
  36. edge = lb_expr_untyped_const_to_typed(m, right, t_llvm_bool);
  37. } else {
  38. edge = lb_emit_conv(p, lb_build_expr(p, right), t_llvm_bool);
  39. }
  40. GB_ASSERT(edge.type == t_llvm_bool);
  41. incoming_values[done->preds.count] = edge.value;
  42. incoming_blocks[done->preds.count] = p->curr_block->block;
  43. lb_emit_jump(p, done);
  44. lb_start_block(p, done);
  45. LLVMTypeRef dst_type = lb_type(m, t_llvm_bool);
  46. LLVMValueRef phi = nullptr;
  47. GB_ASSERT(incoming_values.count == incoming_blocks.count);
  48. GB_ASSERT(incoming_values.count > 0);
  49. LLVMTypeRef phi_type = nullptr;
  50. for (LLVMValueRef incoming_value : incoming_values) {
  51. if (!LLVMIsConstant(incoming_value)) {
  52. phi_type = LLVMTypeOf(incoming_value);
  53. break;
  54. }
  55. }
  56. lbValue res = {};
  57. if (phi_type == nullptr) {
  58. phi = LLVMBuildPhi(p->builder, dst_type, "");
  59. LLVMAddIncoming(phi, incoming_values.data, incoming_blocks.data, cast(unsigned)incoming_values.count);
  60. res.value = phi;
  61. res.type = t_llvm_bool;
  62. } else {
  63. for_array(i, incoming_values) {
  64. LLVMValueRef incoming_value = incoming_values[i];
  65. LLVMTypeRef incoming_type = LLVMTypeOf(incoming_value);
  66. if (phi_type != incoming_type) {
  67. GB_ASSERT_MSG(LLVMIsConstant(incoming_value), "%s vs %s", LLVMPrintTypeToString(phi_type), LLVMPrintTypeToString(incoming_type));
  68. bool ok = !!LLVMConstIntGetZExtValue(incoming_value);
  69. incoming_values[i] = LLVMConstInt(phi_type, ok, false);
  70. }
  71. }
  72. // NOTE(bill): this now only uses i1 for the logic to prevent issues with corrupted booleans which are not of value 0 or 1 (e.g. 2)
  73. // Doing this may produce slightly worse code as a result but it will be correct behaviour
  74. phi = LLVMBuildPhi(p->builder, phi_type, "");
  75. LLVMAddIncoming(phi, incoming_values.data, incoming_blocks.data, cast(unsigned)incoming_values.count);
  76. res.value = phi;
  77. res.type = t_llvm_bool;
  78. }
  79. return lb_emit_conv(p, res, default_type(final_type));
  80. }
  81. gb_internal lbValue lb_emit_unary_arith(lbProcedure *p, TokenKind op, lbValue x, Type *type) {
  82. switch (op) {
  83. case Token_Add:
  84. return x;
  85. case Token_Not: // Boolean not
  86. case Token_Xor: // Bitwise not
  87. case Token_Sub: // Number negation
  88. break;
  89. case Token_Pointer:
  90. GB_PANIC("This should be handled elsewhere");
  91. break;
  92. }
  93. if (is_type_array_like(x.type)) {
  94. // IMPORTANT TODO(bill): This is very wasteful with regards to stack memory
  95. Type *tl = base_type(x.type);
  96. lbValue val = lb_address_from_load_or_generate_local(p, x);
  97. GB_ASSERT(is_type_array_like(type));
  98. Type *elem_type = base_array_type(type);
  99. // NOTE(bill): Doesn't need to be zero because it will be initialized in the loops
  100. lbAddr res_addr = lb_add_local(p, type, nullptr, false, true);
  101. lbValue res = lb_addr_get_ptr(p, res_addr);
  102. bool inline_array_arith = lb_can_try_to_inline_array_arith(type);
  103. i32 count = cast(i32)get_array_type_count(tl);
  104. LLVMTypeRef vector_type = nullptr;
  105. if (op != Token_Not && lb_try_vector_cast(p->module, val, &vector_type)) {
  106. LLVMValueRef vp = LLVMBuildPointerCast(p->builder, val.value, LLVMPointerType(vector_type, 0), "");
  107. LLVMValueRef v = LLVMBuildLoad2(p->builder, vector_type, vp, "");
  108. LLVMValueRef opv = nullptr;
  109. switch (op) {
  110. case Token_Xor:
  111. opv = LLVMBuildNot(p->builder, v, "");
  112. if (is_type_bit_set(elem_type)) {
  113. ExactValue ev_mask = exact_bit_set_all_set_mask(elem_type);
  114. lbValue mask = lb_const_value(p->module, elem_type, ev_mask);
  115. opv = LLVMBuildAnd(p->builder, opv, mask.value, "");
  116. }
  117. break;
  118. case Token_Sub:
  119. if (is_type_float(elem_type)) {
  120. opv = LLVMBuildFNeg(p->builder, v, "");
  121. } else {
  122. opv = LLVMBuildNeg(p->builder, v, "");
  123. }
  124. break;
  125. }
  126. if (opv != nullptr) {
  127. LLVMSetAlignment(res.value, cast(unsigned)lb_alignof(vector_type));
  128. LLVMValueRef res_ptr = LLVMBuildPointerCast(p->builder, res.value, LLVMPointerType(vector_type, 0), "");
  129. LLVMBuildStore(p->builder, opv, res_ptr);
  130. return lb_emit_conv(p, lb_emit_load(p, res), type);
  131. }
  132. }
  133. if (inline_array_arith) {
  134. // inline
  135. for (i32 i = 0; i < count; i++) {
  136. lbValue e = lb_emit_load(p, lb_emit_array_epi(p, val, i));
  137. lbValue z = lb_emit_unary_arith(p, op, e, elem_type);
  138. lb_emit_store(p, lb_emit_array_epi(p, res, i), z);
  139. }
  140. } else {
  141. auto loop_data = lb_loop_start(p, count, t_i32);
  142. lbValue e = lb_emit_load(p, lb_emit_array_ep(p, val, loop_data.idx));
  143. lbValue z = lb_emit_unary_arith(p, op, e, elem_type);
  144. lb_emit_store(p, lb_emit_array_ep(p, res, loop_data.idx), z);
  145. lb_loop_end(p, loop_data);
  146. }
  147. return lb_emit_load(p, res);
  148. }
  149. if (op == Token_Xor) {
  150. lbValue cmp = {};
  151. cmp.type = x.type;
  152. if (is_type_bit_set(x.type)) {
  153. ExactValue ev_mask = exact_bit_set_all_set_mask(x.type);
  154. lbValue mask = lb_const_value(p->module, x.type, ev_mask);
  155. cmp.value = LLVMBuildXor(p->builder, x.value, mask.value, "");
  156. } else {
  157. cmp.value = LLVMBuildNot(p->builder, x.value, "");
  158. }
  159. return lb_emit_conv(p, cmp, type);
  160. }
  161. if (op == Token_Not) {
  162. lbValue cmp = {};
  163. LLVMValueRef zero = LLVMConstInt(lb_type(p->module, x.type), 0, false);
  164. cmp.value = LLVMBuildICmp(p->builder, LLVMIntEQ, x.value, zero, "");
  165. cmp.type = t_llvm_bool;
  166. return lb_emit_conv(p, cmp, type);
  167. }
  168. if (op == Token_Sub && is_type_integer(type) && is_type_different_to_arch_endianness(type)) {
  169. Type *platform_type = integer_endian_type_to_platform_type(type);
  170. lbValue v = lb_emit_byte_swap(p, x, platform_type);
  171. lbValue res = {};
  172. res.value = LLVMBuildNeg(p->builder, v.value, "");
  173. res.type = platform_type;
  174. return lb_emit_byte_swap(p, res, type);
  175. }
  176. if (op == Token_Sub && is_type_float(type) && is_type_different_to_arch_endianness(type)) {
  177. Type *platform_type = integer_endian_type_to_platform_type(type);
  178. lbValue v = lb_emit_byte_swap(p, x, platform_type);
  179. lbValue res = {};
  180. res.value = LLVMBuildFNeg(p->builder, v.value, "");
  181. res.type = platform_type;
  182. return lb_emit_byte_swap(p, res, type);
  183. }
  184. lbValue res = {};
  185. switch (op) {
  186. case Token_Not: // Boolean not
  187. case Token_Xor: // Bitwise not
  188. res.value = LLVMBuildNot(p->builder, x.value, "");
  189. res.type = x.type;
  190. return res;
  191. case Token_Sub: // Number negation
  192. if (is_type_integer(x.type)) {
  193. res.value = LLVMBuildNeg(p->builder, x.value, "");
  194. } else if (is_type_float(x.type)) {
  195. res.value = LLVMBuildFNeg(p->builder, x.value, "");
  196. } else if (is_type_complex(x.type)) {
  197. LLVMValueRef v0 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 0, ""), "");
  198. LLVMValueRef v1 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 1, ""), "");
  199. lbAddr addr = lb_add_local_generated(p, x.type, false);
  200. LLVMTypeRef type = llvm_addr_type(p->module, addr.addr);
  201. LLVMBuildStore(p->builder, v0, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 0, ""));
  202. LLVMBuildStore(p->builder, v1, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 1, ""));
  203. return lb_addr_load(p, addr);
  204. } else if (is_type_quaternion(x.type)) {
  205. LLVMValueRef v0 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 0, ""), "");
  206. LLVMValueRef v1 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 1, ""), "");
  207. LLVMValueRef v2 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 2, ""), "");
  208. LLVMValueRef v3 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 3, ""), "");
  209. lbAddr addr = lb_add_local_generated(p, x.type, false);
  210. LLVMTypeRef type = llvm_addr_type(p->module, addr.addr);
  211. LLVMBuildStore(p->builder, v0, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 0, ""));
  212. LLVMBuildStore(p->builder, v1, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 1, ""));
  213. LLVMBuildStore(p->builder, v2, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 2, ""));
  214. LLVMBuildStore(p->builder, v3, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 3, ""));
  215. return lb_addr_load(p, addr);
  216. } else if (is_type_simd_vector(x.type)) {
  217. Type *elem = base_array_type(x.type);
  218. if (is_type_float(elem)) {
  219. res.value = LLVMBuildFNeg(p->builder, x.value, "");
  220. } else {
  221. res.value = LLVMBuildNeg(p->builder, x.value, "");
  222. }
  223. } else if (is_type_matrix(x.type)) {
  224. lbValue zero = {};
  225. zero.value = LLVMConstNull(lb_type(p->module, type));
  226. zero.type = type;
  227. return lb_emit_arith_matrix(p, Token_Sub, zero, x, type, true);
  228. } else {
  229. GB_PANIC("Unhandled type %s", type_to_string(x.type));
  230. }
  231. res.type = x.type;
  232. return res;
  233. }
  234. return res;
  235. }
  236. gb_internal bool lb_try_direct_vector_arith(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type, lbValue *res_) {
  237. GB_ASSERT(is_type_array_like(type));
  238. Type *elem_type = base_array_type(type);
  239. // NOTE(bill): Shift operations cannot be easily dealt with due to Odin's semantics
  240. if (op == Token_Shl || op == Token_Shr) {
  241. return false;
  242. }
  243. if (!LLVMIsALoadInst(lhs.value) || !LLVMIsALoadInst(rhs.value)) {
  244. return false;
  245. }
  246. lbValue lhs_ptr = {};
  247. lbValue rhs_ptr = {};
  248. lhs_ptr.value = LLVMGetOperand(lhs.value, 0);
  249. lhs_ptr.type = alloc_type_pointer(lhs.type);
  250. rhs_ptr.value = LLVMGetOperand(rhs.value, 0);
  251. rhs_ptr.type = alloc_type_pointer(rhs.type);
  252. LLVMTypeRef vector_type0 = nullptr;
  253. LLVMTypeRef vector_type1 = nullptr;
  254. if (lb_try_vector_cast(p->module, lhs_ptr, &vector_type0) &&
  255. lb_try_vector_cast(p->module, rhs_ptr, &vector_type1)) {
  256. GB_ASSERT(vector_type0 == vector_type1);
  257. LLVMTypeRef vector_type = vector_type0;
  258. Type *integral_type = base_type(elem_type);
  259. if (is_type_simd_vector(integral_type)) {
  260. integral_type = core_array_type(integral_type);
  261. }
  262. if (is_type_bit_set(integral_type)) {
  263. switch (op) {
  264. case Token_Add: op = Token_Or; break;
  265. case Token_Sub: op = Token_AndNot; break;
  266. }
  267. Type *u = bit_set_to_int(type);
  268. if (is_type_array(u)) {
  269. return false;
  270. }
  271. }
  272. LLVMValueRef lhs_vp = LLVMBuildPointerCast(p->builder, lhs_ptr.value, LLVMPointerType(vector_type, 0), "");
  273. LLVMValueRef rhs_vp = LLVMBuildPointerCast(p->builder, rhs_ptr.value, LLVMPointerType(vector_type, 0), "");
  274. LLVMValueRef x = LLVMBuildLoad2(p->builder, vector_type, lhs_vp, "");
  275. LLVMValueRef y = LLVMBuildLoad2(p->builder, vector_type, rhs_vp, "");
  276. LLVMValueRef z = nullptr;
  277. if (is_type_float(integral_type)) {
  278. switch (op) {
  279. case Token_Add:
  280. z = LLVMBuildFAdd(p->builder, x, y, "");
  281. break;
  282. case Token_Sub:
  283. z = LLVMBuildFSub(p->builder, x, y, "");
  284. break;
  285. case Token_Mul:
  286. z = LLVMBuildFMul(p->builder, x, y, "");
  287. break;
  288. case Token_Quo:
  289. z = LLVMBuildFDiv(p->builder, x, y, "");
  290. break;
  291. case Token_Mod:
  292. z = LLVMBuildFRem(p->builder, x, y, "");
  293. break;
  294. default:
  295. GB_PANIC("Unsupported vector operation %.*s", LIT(token_strings[op]));
  296. break;
  297. }
  298. } else {
  299. switch (op) {
  300. case Token_Add:
  301. z = LLVMBuildAdd(p->builder, x, y, "");
  302. break;
  303. case Token_Sub:
  304. z = LLVMBuildSub(p->builder, x, y, "");
  305. break;
  306. case Token_Mul:
  307. z = LLVMBuildMul(p->builder, x, y, "");
  308. break;
  309. case Token_Quo:
  310. if (is_type_unsigned(integral_type)) {
  311. z = LLVMBuildUDiv(p->builder, x, y, "");
  312. } else {
  313. z = LLVMBuildSDiv(p->builder, x, y, "");
  314. }
  315. break;
  316. case Token_Mod:
  317. if (is_type_unsigned(integral_type)) {
  318. z = LLVMBuildURem(p->builder, x, y, "");
  319. } else {
  320. z = LLVMBuildSRem(p->builder, x, y, "");
  321. }
  322. break;
  323. case Token_ModMod:
  324. if (is_type_unsigned(integral_type)) {
  325. z = LLVMBuildURem(p->builder, x, y, "");
  326. } else {
  327. LLVMValueRef a = LLVMBuildSRem(p->builder, x, y, "");
  328. LLVMValueRef b = LLVMBuildAdd(p->builder, a, y, "");
  329. z = LLVMBuildSRem(p->builder, b, y, "");
  330. }
  331. break;
  332. case Token_And:
  333. z = LLVMBuildAnd(p->builder, x, y, "");
  334. break;
  335. case Token_AndNot:
  336. z = LLVMBuildAnd(p->builder, x, LLVMBuildNot(p->builder, y, ""), "");
  337. break;
  338. case Token_Or:
  339. z = LLVMBuildOr(p->builder, x, y, "");
  340. break;
  341. case Token_Xor:
  342. z = LLVMBuildXor(p->builder, x, y, "");
  343. break;
  344. default:
  345. GB_PANIC("Unsupported vector operation");
  346. break;
  347. }
  348. }
  349. if (z != nullptr) {
  350. lbAddr res = lb_add_local_generated_temp(p, type, lb_alignof(vector_type));
  351. LLVMValueRef vp = LLVMBuildPointerCast(p->builder, res.addr.value, LLVMPointerType(vector_type, 0), "");
  352. LLVMBuildStore(p->builder, z, vp);
  353. lbValue v = lb_addr_load(p, res);
  354. if (res_) *res_ = v;
  355. return true;
  356. }
  357. }
  358. return false;
  359. }
  360. gb_internal lbValue lb_emit_arith_array(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type) {
  361. GB_ASSERT(is_type_array_like(lhs.type) || is_type_array_like(rhs.type));
  362. lhs = lb_emit_conv(p, lhs, type);
  363. rhs = lb_emit_conv(p, rhs, type);
  364. GB_ASSERT(is_type_array_like(type));
  365. Type *elem_type = base_array_type(type);
  366. i64 count = get_array_type_count(type);
  367. unsigned n = cast(unsigned)count;
  368. // NOTE(bill, 2021-06-12): Try to do a direct operation as a vector, if possible
  369. lbValue direct_vector_res = {};
  370. if (lb_try_direct_vector_arith(p, op, lhs, rhs, type, &direct_vector_res)) {
  371. return direct_vector_res;
  372. }
  373. bool inline_array_arith = lb_can_try_to_inline_array_arith(type);
  374. if (inline_array_arith) {
  375. auto dst_ptrs = slice_make<lbValue>(temporary_allocator(), n);
  376. auto a_loads = slice_make<lbValue>(temporary_allocator(), n);
  377. auto b_loads = slice_make<lbValue>(temporary_allocator(), n);
  378. auto c_ops = slice_make<lbValue>(temporary_allocator(), n);
  379. for (unsigned i = 0; i < n; i++) {
  380. a_loads[i].value = LLVMBuildExtractValue(p->builder, lhs.value, i, "");
  381. a_loads[i].type = elem_type;
  382. }
  383. for (unsigned i = 0; i < n; i++) {
  384. b_loads[i].value = LLVMBuildExtractValue(p->builder, rhs.value, i, "");
  385. b_loads[i].type = elem_type;
  386. }
  387. for (unsigned i = 0; i < n; i++) {
  388. c_ops[i] = lb_emit_arith(p, op, a_loads[i], b_loads[i], elem_type);
  389. }
  390. lbAddr res = lb_add_local_generated(p, type, false);
  391. for (unsigned i = 0; i < n; i++) {
  392. dst_ptrs[i] = lb_emit_array_epi(p, res.addr, i);
  393. }
  394. for (unsigned i = 0; i < n; i++) {
  395. lb_emit_store(p, dst_ptrs[i], c_ops[i]);
  396. }
  397. return lb_addr_load(p, res);
  398. } else {
  399. lbValue x = lb_address_from_load_or_generate_local(p, lhs);
  400. lbValue y = lb_address_from_load_or_generate_local(p, rhs);
  401. lbAddr res = lb_add_local_generated(p, type, false);
  402. auto loop_data = lb_loop_start(p, cast(isize)count, t_i32);
  403. lbValue a_ptr = lb_emit_array_ep(p, x, loop_data.idx);
  404. lbValue b_ptr = lb_emit_array_ep(p, y, loop_data.idx);
  405. lbValue dst_ptr = lb_emit_array_ep(p, res.addr, loop_data.idx);
  406. lbValue a = lb_emit_load(p, a_ptr);
  407. lbValue b = lb_emit_load(p, b_ptr);
  408. lbValue c = lb_emit_arith(p, op, a, b, elem_type);
  409. lb_emit_store(p, dst_ptr, c);
  410. lb_loop_end(p, loop_data);
  411. return lb_addr_load(p, res);
  412. }
  413. }
  414. gb_internal bool lb_is_matrix_simdable(Type *t) {
  415. Type *mt = base_type(t);
  416. GB_ASSERT(mt->kind == Type_Matrix);
  417. Type *elem = core_type(mt->Matrix.elem);
  418. if (is_type_complex(elem)) {
  419. return false;
  420. }
  421. if (is_type_different_to_arch_endianness(elem)) {
  422. return false;
  423. }
  424. switch (build_context.metrics.arch) {
  425. default:
  426. return false;
  427. case TargetArch_amd64:
  428. case TargetArch_arm64:
  429. break;
  430. }
  431. if (type_align_of(t) < 16) {
  432. // it's not aligned well enough to use the vector instructions
  433. return false;
  434. }
  435. if ((mt->Matrix.row_count & 1) ^ (mt->Matrix.column_count & 1)) {
  436. return false;
  437. }
  438. if (mt->Matrix.is_row_major) {
  439. // TODO(bill): make #row_major matrices work with SIMD
  440. return false;
  441. }
  442. if (elem->kind == Type_Basic) {
  443. switch (elem->Basic.kind) {
  444. case Basic_f16:
  445. case Basic_f16le:
  446. case Basic_f16be:
  447. switch (build_context.metrics.arch) {
  448. case TargetArch_amd64:
  449. return false;
  450. case TargetArch_arm64:
  451. // TODO(bill): determine when this is fine
  452. return true;
  453. case TargetArch_i386:
  454. case TargetArch_wasm32:
  455. case TargetArch_wasm64p32:
  456. return false;
  457. }
  458. }
  459. }
  460. return true;
  461. }
  462. gb_internal LLVMValueRef lb_matrix_to_vector(lbProcedure *p, lbValue matrix) {
  463. Type *mt = base_type(matrix.type);
  464. GB_ASSERT(mt->kind == Type_Matrix);
  465. LLVMTypeRef elem_type = lb_type(p->module, mt->Matrix.elem);
  466. unsigned total_count = cast(unsigned)matrix_type_total_internal_elems(mt);
  467. LLVMTypeRef total_matrix_type = LLVMVectorType(elem_type, total_count);
  468. #if 1
  469. LLVMValueRef ptr = lb_address_from_load_or_generate_local(p, matrix).value;
  470. LLVMValueRef matrix_vector_ptr = LLVMBuildPointerCast(p->builder, ptr, LLVMPointerType(total_matrix_type, 0), "");
  471. LLVMValueRef matrix_vector = LLVMBuildLoad2(p->builder, total_matrix_type, matrix_vector_ptr, "");
  472. LLVMSetAlignment(matrix_vector, cast(unsigned)type_align_of(mt));
  473. return matrix_vector;
  474. #else
  475. LLVMValueRef matrix_vector = LLVMBuildBitCast(p->builder, matrix.value, total_matrix_type, "");
  476. return matrix_vector;
  477. #endif
  478. }
  479. gb_internal LLVMValueRef lb_matrix_trimmed_vector_mask(lbProcedure *p, Type *mt) {
  480. mt = base_type(mt);
  481. GB_ASSERT(mt->kind == Type_Matrix);
  482. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  483. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  484. unsigned column_count = cast(unsigned)mt->Matrix.column_count;
  485. unsigned mask_elems_index = 0;
  486. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), row_count*column_count);
  487. for (unsigned j = 0; j < column_count; j++) {
  488. for (unsigned i = 0; i < row_count; i++) {
  489. unsigned offset = stride*j + i;
  490. mask_elems[mask_elems_index++] = lb_const_int(p->module, t_u32, offset).value;
  491. }
  492. }
  493. LLVMValueRef mask = LLVMConstVector(mask_elems.data, cast(unsigned)mask_elems.count);
  494. return mask;
  495. }
  496. gb_internal LLVMValueRef lb_matrix_to_trimmed_vector(lbProcedure *p, lbValue m) {
  497. LLVMValueRef vector = lb_matrix_to_vector(p, m);
  498. Type *mt = base_type(m.type);
  499. GB_ASSERT(mt->kind == Type_Matrix);
  500. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  501. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  502. if (stride == row_count) {
  503. return vector;
  504. }
  505. LLVMValueRef mask = lb_matrix_trimmed_vector_mask(p, mt);
  506. LLVMValueRef trimmed_vector = llvm_basic_shuffle(p, vector, mask);
  507. return trimmed_vector;
  508. }
  509. gb_internal lbValue lb_emit_matrix_tranpose(lbProcedure *p, lbValue m, Type *type) {
  510. if (is_type_array(m.type)) {
  511. i32 rank = type_math_rank(m.type);
  512. if (rank == 2) {
  513. lbAddr addr = lb_add_local_generated(p, type, false);
  514. lbValue dst = addr.addr;
  515. lbValue src = m;
  516. i32 n = cast(i32)get_array_type_count(m.type);
  517. i32 m = cast(i32)get_array_type_count(type);
  518. // m.type == [n][m]T
  519. // type == [m][n]T
  520. for (i32 j = 0; j < m; j++) {
  521. lbValue dst_col = lb_emit_struct_ep(p, dst, j);
  522. for (i32 i = 0; i < n; i++) {
  523. lbValue dst_row = lb_emit_struct_ep(p, dst_col, i);
  524. lbValue src_col = lb_emit_struct_ev(p, src, i);
  525. lbValue src_row = lb_emit_struct_ev(p, src_col, j);
  526. lb_emit_store(p, dst_row, src_row);
  527. }
  528. }
  529. return lb_addr_load(p, addr);
  530. }
  531. // no-op
  532. m.type = type;
  533. return m;
  534. }
  535. Type *mt = base_type(m.type);
  536. GB_ASSERT(mt->kind == Type_Matrix);
  537. if (lb_is_matrix_simdable(mt)) {
  538. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  539. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  540. unsigned column_count = cast(unsigned)mt->Matrix.column_count;
  541. auto rows = slice_make<LLVMValueRef>(permanent_allocator(), row_count);
  542. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  543. LLVMValueRef vector = lb_matrix_to_vector(p, m);
  544. for (unsigned i = 0; i < row_count; i++) {
  545. for (unsigned j = 0; j < column_count; j++) {
  546. unsigned offset = stride*j + i;
  547. mask_elems[j] = lb_const_int(p->module, t_u32, offset).value;
  548. }
  549. // transpose mask
  550. LLVMValueRef mask = LLVMConstVector(mask_elems.data, column_count);
  551. LLVMValueRef row = llvm_basic_shuffle(p, vector, mask);
  552. rows[i] = row;
  553. }
  554. lbAddr res = lb_add_local_generated(p, type, true);
  555. for_array(i, rows) {
  556. LLVMValueRef row = rows[i];
  557. lbValue dst_row_ptr = lb_emit_matrix_epi(p, res.addr, 0, i);
  558. LLVMValueRef ptr = dst_row_ptr.value;
  559. ptr = LLVMBuildPointerCast(p->builder, ptr, LLVMPointerType(LLVMTypeOf(row), 0), "");
  560. LLVMBuildStore(p->builder, row, ptr);
  561. }
  562. return lb_addr_load(p, res);
  563. }
  564. lbAddr res = lb_add_local_generated(p, type, true);
  565. i64 row_count = mt->Matrix.row_count;
  566. i64 column_count = mt->Matrix.column_count;
  567. for (i64 j = 0; j < column_count; j++) {
  568. for (i64 i = 0; i < row_count; i++) {
  569. lbValue src = lb_emit_matrix_ev(p, m, i, j);
  570. lbValue dst = lb_emit_matrix_epi(p, res.addr, j, i);
  571. lb_emit_store(p, dst, src);
  572. }
  573. }
  574. return lb_addr_load(p, res);
  575. }
  576. gb_internal lbValue lb_matrix_cast_vector_to_type(lbProcedure *p, LLVMValueRef vector, Type *type) {
  577. lbAddr res = lb_add_local_generated(p, type, true);
  578. LLVMValueRef res_ptr = res.addr.value;
  579. unsigned alignment = cast(unsigned)gb_max(type_align_of(type), lb_alignof(LLVMTypeOf(vector)));
  580. LLVMSetAlignment(res_ptr, alignment);
  581. res_ptr = LLVMBuildPointerCast(p->builder, res_ptr, LLVMPointerType(LLVMTypeOf(vector), 0), "");
  582. LLVMBuildStore(p->builder, vector, res_ptr);
  583. return lb_addr_load(p, res);
  584. }
  585. gb_internal lbValue lb_emit_matrix_flatten(lbProcedure *p, lbValue m, Type *type) {
  586. if (is_type_array(m.type)) {
  587. // no-op
  588. m.type = type;
  589. return m;
  590. }
  591. Type *mt = base_type(m.type);
  592. GB_ASSERT(mt->kind == Type_Matrix);
  593. lbAddr res = lb_add_local_generated(p, type, true);
  594. GB_ASSERT(type_size_of(type) == type_size_of(m.type));
  595. lbValue m_ptr = lb_address_from_load_or_generate_local(p, m);
  596. lbValue n = lb_const_int(p->module, t_int, type_size_of(type));
  597. lb_mem_copy_non_overlapping(p, res.addr, m_ptr, n);
  598. // i64 row_count = mt->Matrix.row_count;
  599. // i64 column_count = mt->Matrix.column_count;
  600. // TEMPORARY_ALLOCATOR_GUARD();
  601. // auto srcs = array_make<lbValue>(temporary_allocator(), 0, row_count*column_count);
  602. // auto dsts = array_make<lbValue>(temporary_allocator(), 0, row_count*column_count);
  603. // for (i64 j = 0; j < column_count; j++) {
  604. // for (i64 i = 0; i < row_count; i++) {
  605. // lbValue src = lb_emit_matrix_ev(p, m, i, j);
  606. // array_add(&srcs, src);
  607. // }
  608. // }
  609. // for (i64 j = 0; j < column_count; j++) {
  610. // for (i64 i = 0; i < row_count; i++) {
  611. // lbValue dst = lb_emit_array_epi(p, res.addr, i + j*row_count);
  612. // array_add(&dsts, dst);
  613. // }
  614. // }
  615. // GB_ASSERT(srcs.count == dsts.count);
  616. // for_array(i, srcs) {
  617. // lb_emit_store(p, dsts[i], srcs[i]);
  618. // }
  619. return lb_addr_load(p, res);
  620. }
  621. gb_internal lbValue lb_emit_outer_product(lbProcedure *p, lbValue a, lbValue b, Type *type) {
  622. Type *mt = base_type(type);
  623. Type *at = base_type(a.type);
  624. Type *bt = base_type(b.type);
  625. GB_ASSERT(mt->kind == Type_Matrix);
  626. GB_ASSERT(at->kind == Type_Array);
  627. GB_ASSERT(bt->kind == Type_Array);
  628. i64 row_count = mt->Matrix.row_count;
  629. i64 column_count = mt->Matrix.column_count;
  630. GB_ASSERT(row_count == at->Array.count);
  631. GB_ASSERT(column_count == bt->Array.count);
  632. lbAddr res = lb_add_local_generated(p, type, true);
  633. for (i64 j = 0; j < column_count; j++) {
  634. for (i64 i = 0; i < row_count; i++) {
  635. lbValue x = lb_emit_struct_ev(p, a, cast(i32)i);
  636. lbValue y = lb_emit_struct_ev(p, b, cast(i32)j);
  637. lbValue src = lb_emit_arith(p, Token_Mul, x, y, mt->Matrix.elem);
  638. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  639. lb_emit_store(p, dst, src);
  640. }
  641. }
  642. return lb_addr_load(p, res);
  643. }
  644. gb_internal lbValue lb_emit_matrix_mul(lbProcedure *p, lbValue lhs, lbValue rhs, Type *type) {
  645. // TODO(bill): Handle edge case for f16 types on x86(-64) platforms
  646. Type *xt = base_type(lhs.type);
  647. Type *yt = base_type(rhs.type);
  648. GB_ASSERT(is_type_matrix(type));
  649. GB_ASSERT(is_type_matrix(xt));
  650. GB_ASSERT(is_type_matrix(yt));
  651. GB_ASSERT(xt->Matrix.column_count == yt->Matrix.row_count);
  652. GB_ASSERT(are_types_identical(xt->Matrix.elem, yt->Matrix.elem));
  653. GB_ASSERT(xt->Matrix.is_row_major == yt->Matrix.is_row_major);
  654. Type *elem = xt->Matrix.elem;
  655. unsigned outer_rows = cast(unsigned)xt->Matrix.row_count;
  656. unsigned inner = cast(unsigned)xt->Matrix.column_count;
  657. unsigned outer_columns = cast(unsigned)yt->Matrix.column_count;
  658. if (!xt->Matrix.is_row_major && lb_is_matrix_simdable(xt)) {
  659. unsigned x_stride = cast(unsigned)matrix_type_stride_in_elems(xt);
  660. unsigned y_stride = cast(unsigned)matrix_type_stride_in_elems(yt);
  661. auto x_rows = slice_make<LLVMValueRef>(permanent_allocator(), outer_rows);
  662. auto y_columns = slice_make<LLVMValueRef>(permanent_allocator(), outer_columns);
  663. LLVMValueRef x_vector = lb_matrix_to_vector(p, lhs);
  664. LLVMValueRef y_vector = lb_matrix_to_vector(p, rhs);
  665. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), inner);
  666. for (unsigned i = 0; i < outer_rows; i++) {
  667. for (unsigned j = 0; j < inner; j++) {
  668. unsigned offset = x_stride*j + i;
  669. mask_elems[j] = lb_const_int(p->module, t_u32, offset).value;
  670. }
  671. // transpose mask
  672. LLVMValueRef mask = LLVMConstVector(mask_elems.data, inner);
  673. LLVMValueRef row = llvm_basic_shuffle(p, x_vector, mask);
  674. x_rows[i] = row;
  675. }
  676. for (unsigned i = 0; i < outer_columns; i++) {
  677. LLVMValueRef mask = llvm_mask_iota(p->module, y_stride*i, inner);
  678. LLVMValueRef column = llvm_basic_shuffle(p, y_vector, mask);
  679. y_columns[i] = column;
  680. }
  681. lbAddr res = lb_add_local_generated(p, type, true);
  682. for_array(i, x_rows) {
  683. LLVMValueRef x_row = x_rows[i];
  684. for_array(j, y_columns) {
  685. LLVMValueRef y_column = y_columns[j];
  686. LLVMValueRef elem = llvm_vector_dot(p, x_row, y_column);
  687. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  688. LLVMBuildStore(p->builder, elem, dst.value);
  689. }
  690. }
  691. return lb_addr_load(p, res);
  692. }
  693. if (!xt->Matrix.is_row_major) {
  694. lbAddr res = lb_add_local_generated(p, type, true);
  695. auto inners = slice_make<lbValue[2]>(permanent_allocator(), inner);
  696. for (unsigned j = 0; j < outer_columns; j++) {
  697. for (unsigned i = 0; i < outer_rows; i++) {
  698. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  699. for (unsigned k = 0; k < inner; k++) {
  700. inners[k][0] = lb_emit_matrix_ev(p, lhs, i, k);
  701. inners[k][1] = lb_emit_matrix_ev(p, rhs, k, j);
  702. }
  703. lbValue sum = lb_const_nil(p->module, elem);
  704. for (unsigned k = 0; k < inner; k++) {
  705. lbValue a = inners[k][0];
  706. lbValue b = inners[k][1];
  707. sum = lb_emit_mul_add(p, a, b, sum, elem);
  708. }
  709. lb_emit_store(p, dst, sum);
  710. }
  711. }
  712. return lb_addr_load(p, res);
  713. } else {
  714. lbAddr res = lb_add_local_generated(p, type, true);
  715. auto inners = slice_make<lbValue[2]>(permanent_allocator(), inner);
  716. for (unsigned i = 0; i < outer_rows; i++) {
  717. for (unsigned j = 0; j < outer_columns; j++) {
  718. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  719. for (unsigned k = 0; k < inner; k++) {
  720. inners[k][0] = lb_emit_matrix_ev(p, lhs, i, k);
  721. inners[k][1] = lb_emit_matrix_ev(p, rhs, k, j);
  722. }
  723. lbValue sum = lb_const_nil(p->module, elem);
  724. for (unsigned k = 0; k < inner; k++) {
  725. lbValue a = inners[k][0];
  726. lbValue b = inners[k][1];
  727. sum = lb_emit_mul_add(p, a, b, sum, elem);
  728. }
  729. lb_emit_store(p, dst, sum);
  730. }
  731. }
  732. return lb_addr_load(p, res);
  733. }
  734. }
  735. gb_internal lbValue lb_emit_matrix_mul_vector(lbProcedure *p, lbValue lhs, lbValue rhs, Type *type) {
  736. // TODO(bill): Handle edge case for f16 types on x86(-64) platforms
  737. Type *mt = base_type(lhs.type);
  738. Type *vt = base_type(rhs.type);
  739. GB_ASSERT(is_type_matrix(mt));
  740. GB_ASSERT(is_type_array_like(vt));
  741. i64 vector_count = get_array_type_count(vt);
  742. GB_ASSERT(mt->Matrix.column_count == vector_count);
  743. GB_ASSERT(are_types_identical(mt->Matrix.elem, base_array_type(vt)));
  744. Type *elem = mt->Matrix.elem;
  745. if (!mt->Matrix.is_row_major && lb_is_matrix_simdable(mt)) {
  746. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  747. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  748. unsigned column_count = cast(unsigned)mt->Matrix.column_count;
  749. auto m_columns = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  750. auto v_rows = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  751. LLVMValueRef matrix_vector = lb_matrix_to_vector(p, lhs);
  752. for (unsigned column_index = 0; column_index < column_count; column_index++) {
  753. LLVMValueRef mask = llvm_mask_iota(p->module, stride*column_index, row_count);
  754. LLVMValueRef column = llvm_basic_shuffle(p, matrix_vector, mask);
  755. m_columns[column_index] = column;
  756. }
  757. for (unsigned row_index = 0; row_index < column_count; row_index++) {
  758. LLVMValueRef value = lb_emit_struct_ev(p, rhs, row_index).value;
  759. LLVMValueRef row = llvm_vector_broadcast(p, value, row_count);
  760. v_rows[row_index] = row;
  761. }
  762. GB_ASSERT(column_count > 0);
  763. LLVMValueRef vector = nullptr;
  764. for (i64 i = 0; i < column_count; i++) {
  765. if (i == 0) {
  766. vector = llvm_vector_mul(p, m_columns[i], v_rows[i]);
  767. } else {
  768. vector = llvm_vector_mul_add(p, m_columns[i], v_rows[i], vector);
  769. }
  770. }
  771. return lb_matrix_cast_vector_to_type(p, vector, type);
  772. }
  773. lbAddr res = lb_add_local_generated(p, type, true);
  774. for (i64 i = 0; i < mt->Matrix.row_count; i++) {
  775. for (i64 j = 0; j < mt->Matrix.column_count; j++) {
  776. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, 0);
  777. lbValue d0 = lb_emit_load(p, dst);
  778. lbValue a = lb_emit_matrix_ev(p, lhs, i, j);
  779. lbValue b = lb_emit_struct_ev(p, rhs, cast(i32)j);
  780. lbValue c = lb_emit_mul_add(p, a, b, d0, elem);
  781. lb_emit_store(p, dst, c);
  782. }
  783. }
  784. return lb_addr_load(p, res);
  785. }
  786. gb_internal lbValue lb_emit_vector_mul_matrix(lbProcedure *p, lbValue lhs, lbValue rhs, Type *type) {
  787. // TODO(bill): Handle edge case for f16 types on x86(-64) platforms
  788. Type *mt = base_type(rhs.type);
  789. Type *vt = base_type(lhs.type);
  790. GB_ASSERT(is_type_matrix(mt));
  791. GB_ASSERT(is_type_array_like(vt));
  792. i64 vector_count = get_array_type_count(vt);
  793. GB_ASSERT(vector_count == mt->Matrix.row_count);
  794. GB_ASSERT(are_types_identical(mt->Matrix.elem, base_array_type(vt)));
  795. Type *elem = mt->Matrix.elem;
  796. if (!mt->Matrix.is_row_major && lb_is_matrix_simdable(mt)) {
  797. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  798. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  799. unsigned column_count = cast(unsigned)mt->Matrix.column_count; gb_unused(column_count);
  800. auto m_columns = slice_make<LLVMValueRef>(permanent_allocator(), row_count);
  801. auto v_rows = slice_make<LLVMValueRef>(permanent_allocator(), row_count);
  802. LLVMValueRef matrix_vector = lb_matrix_to_vector(p, rhs);
  803. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  804. for (unsigned row_index = 0; row_index < row_count; row_index++) {
  805. for (unsigned column_index = 0; column_index < column_count; column_index++) {
  806. unsigned offset = row_index + column_index*stride;
  807. mask_elems[column_index] = lb_const_int(p->module, t_u32, offset).value;
  808. }
  809. // transpose mask
  810. LLVMValueRef mask = LLVMConstVector(mask_elems.data, column_count);
  811. LLVMValueRef column = llvm_basic_shuffle(p, matrix_vector, mask);
  812. m_columns[row_index] = column;
  813. }
  814. for (unsigned column_index = 0; column_index < row_count; column_index++) {
  815. LLVMValueRef value = lb_emit_struct_ev(p, lhs, column_index).value;
  816. LLVMValueRef row = llvm_vector_broadcast(p, value, column_count);
  817. v_rows[column_index] = row;
  818. }
  819. GB_ASSERT(row_count > 0);
  820. LLVMValueRef vector = nullptr;
  821. for (i64 i = 0; i < row_count; i++) {
  822. if (i == 0) {
  823. vector = llvm_vector_mul(p, v_rows[i], m_columns[i]);
  824. } else {
  825. vector = llvm_vector_mul_add(p, v_rows[i], m_columns[i], vector);
  826. }
  827. }
  828. lbAddr res = lb_add_local_generated(p, type, true);
  829. LLVMValueRef res_ptr = res.addr.value;
  830. unsigned alignment = cast(unsigned)gb_max(type_align_of(type), lb_alignof(LLVMTypeOf(vector)));
  831. LLVMSetAlignment(res_ptr, alignment);
  832. res_ptr = LLVMBuildPointerCast(p->builder, res_ptr, LLVMPointerType(LLVMTypeOf(vector), 0), "");
  833. LLVMBuildStore(p->builder, vector, res_ptr);
  834. return lb_addr_load(p, res);
  835. }
  836. lbAddr res = lb_add_local_generated(p, type, true);
  837. for (i64 j = 0; j < mt->Matrix.column_count; j++) {
  838. for (i64 k = 0; k < mt->Matrix.row_count; k++) {
  839. lbValue dst = lb_emit_matrix_epi(p, res.addr, 0, j);
  840. lbValue d0 = lb_emit_load(p, dst);
  841. lbValue a = lb_emit_struct_ev(p, lhs, cast(i32)k);
  842. lbValue b = lb_emit_matrix_ev(p, rhs, k, j);
  843. lbValue c = lb_emit_mul_add(p, a, b, d0, elem);
  844. lb_emit_store(p, dst, c);
  845. }
  846. }
  847. return lb_addr_load(p, res);
  848. }
  849. gb_internal lbValue lb_emit_arith_matrix(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type, bool component_wise) {
  850. GB_ASSERT(is_type_matrix(lhs.type) || is_type_matrix(rhs.type));
  851. if (op == Token_Mul && !component_wise) {
  852. Type *xt = base_type(lhs.type);
  853. Type *yt = base_type(rhs.type);
  854. if (xt->kind == Type_Matrix) {
  855. if (yt->kind == Type_Matrix) {
  856. return lb_emit_matrix_mul(p, lhs, rhs, type);
  857. } else if (is_type_array_like(yt)) {
  858. return lb_emit_matrix_mul_vector(p, lhs, rhs, type);
  859. }
  860. } else if (is_type_array_like(xt)) {
  861. GB_ASSERT(yt->kind == Type_Matrix);
  862. return lb_emit_vector_mul_matrix(p, lhs, rhs, type);
  863. } else {
  864. GB_ASSERT(xt->kind == Type_Basic);
  865. GB_ASSERT(yt->kind == Type_Matrix);
  866. GB_ASSERT(is_type_matrix(type));
  867. Type *array_type = alloc_type_array(yt->Matrix.elem, matrix_type_total_internal_elems(yt));
  868. GB_ASSERT(type_size_of(array_type) == type_size_of(yt));
  869. lbValue array_lhs = lb_emit_conv(p, lhs, array_type);
  870. lbValue array_rhs = rhs;
  871. array_rhs.type = array_type;
  872. lbValue array = lb_emit_arith(p, op, array_lhs, array_rhs, array_type);
  873. array.type = type;
  874. return array;
  875. }
  876. } else {
  877. if (is_type_matrix(lhs.type)) {
  878. rhs = lb_emit_conv(p, rhs, lhs.type);
  879. } else {
  880. lhs = lb_emit_conv(p, lhs, rhs.type);
  881. }
  882. Type *xt = base_type(lhs.type);
  883. Type *yt = base_type(rhs.type);
  884. GB_ASSERT_MSG(are_types_identical(xt, yt), "%s %.*s %s", type_to_string(lhs.type), LIT(token_strings[op]), type_to_string(rhs.type));
  885. GB_ASSERT(xt->kind == Type_Matrix);
  886. // element-wise arithmetic
  887. // pretend it is an array
  888. lbValue array_lhs = lhs;
  889. lbValue array_rhs = rhs;
  890. Type *array_type = alloc_type_array(xt->Matrix.elem, matrix_type_total_internal_elems(xt));
  891. GB_ASSERT(type_size_of(array_type) == type_size_of(xt));
  892. array_lhs.type = array_type;
  893. array_rhs.type = array_type;
  894. if (token_is_comparison(op)) {
  895. lbValue res = lb_emit_comp(p, op, array_lhs, array_rhs);
  896. return lb_emit_conv(p, res, type);
  897. } else {
  898. lbValue array = lb_emit_arith(p, op, array_lhs, array_rhs, array_type);
  899. array.type = type;
  900. return array;
  901. }
  902. }
  903. GB_PANIC("TODO: lb_emit_arith_matrix");
  904. return {};
  905. }
  906. gb_internal lbValue lb_emit_arith(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type) {
  907. if (is_type_array_like(lhs.type) || is_type_array_like(rhs.type)) {
  908. return lb_emit_arith_array(p, op, lhs, rhs, type);
  909. } else if (is_type_matrix(lhs.type) || is_type_matrix(rhs.type)) {
  910. return lb_emit_arith_matrix(p, op, lhs, rhs, type, false);
  911. } else if (is_type_complex(type)) {
  912. lhs = lb_emit_conv(p, lhs, type);
  913. rhs = lb_emit_conv(p, rhs, type);
  914. Type *ft = base_complex_elem_type(type);
  915. if (op == Token_Quo) {
  916. TEMPORARY_ALLOCATOR_GUARD();
  917. auto args = array_make<lbValue>(temporary_allocator(), 2);
  918. args[0] = lhs;
  919. args[1] = rhs;
  920. switch (type_size_of(ft)) {
  921. case 2: return lb_emit_runtime_call(p, "quo_complex32", args);
  922. case 4: return lb_emit_runtime_call(p, "quo_complex64", args);
  923. case 8: return lb_emit_runtime_call(p, "quo_complex128", args);
  924. default: GB_PANIC("Unknown float type"); break;
  925. }
  926. }
  927. lbAddr res = lb_add_local_generated(p, type, false); // NOTE: initialized in full later
  928. lbValue a = lb_emit_struct_ev(p, lhs, 0);
  929. lbValue b = lb_emit_struct_ev(p, lhs, 1);
  930. lbValue c = lb_emit_struct_ev(p, rhs, 0);
  931. lbValue d = lb_emit_struct_ev(p, rhs, 1);
  932. lbValue real = {};
  933. lbValue imag = {};
  934. switch (op) {
  935. case Token_Add:
  936. case Token_Sub:
  937. if (type_size_of(ft) == 2) {
  938. a = lb_emit_conv(p, a, t_f32);
  939. b = lb_emit_conv(p, b, t_f32);
  940. c = lb_emit_conv(p, c, t_f32);
  941. d = lb_emit_conv(p, d, t_f32);
  942. real = lb_emit_arith(p, op, a, c, t_f32);
  943. imag = lb_emit_arith(p, op, b, d, t_f32);
  944. real = lb_emit_conv(p, real, ft);
  945. imag = lb_emit_conv(p, imag, ft);
  946. } else {
  947. real = lb_emit_arith(p, op, a, c, ft);
  948. imag = lb_emit_arith(p, op, b, d, ft);
  949. }
  950. break;
  951. case Token_Mul: {
  952. lbValue x = lb_emit_arith(p, Token_Mul, a, c, ft);
  953. lbValue y = lb_emit_arith(p, Token_Mul, b, d, ft);
  954. real = lb_emit_arith(p, Token_Sub, x, y, ft);
  955. lbValue z = lb_emit_arith(p, Token_Mul, b, c, ft);
  956. lbValue w = lb_emit_arith(p, Token_Mul, a, d, ft);
  957. imag = lb_emit_arith(p, Token_Add, z, w, ft);
  958. break;
  959. }
  960. }
  961. lb_emit_store(p, lb_emit_struct_ep(p, res.addr, 0), real);
  962. lb_emit_store(p, lb_emit_struct_ep(p, res.addr, 1), imag);
  963. return lb_addr_load(p, res);
  964. } else if (is_type_quaternion(type)) {
  965. lhs = lb_emit_conv(p, lhs, type);
  966. rhs = lb_emit_conv(p, rhs, type);
  967. Type *ft = base_complex_elem_type(type);
  968. if (op == Token_Add || op == Token_Sub) {
  969. Type *immediate_type = ft;
  970. if (type_size_of(ft) == 2) {
  971. immediate_type = t_f32;
  972. }
  973. lbAddr res = lb_add_local_generated(p, type, false); // NOTE: initialized in full later
  974. lbValue x0 = lb_emit_struct_ev(p, lhs, 0);
  975. lbValue x1 = lb_emit_struct_ev(p, lhs, 1);
  976. lbValue x2 = lb_emit_struct_ev(p, lhs, 2);
  977. lbValue x3 = lb_emit_struct_ev(p, lhs, 3);
  978. lbValue y0 = lb_emit_struct_ev(p, rhs, 0);
  979. lbValue y1 = lb_emit_struct_ev(p, rhs, 1);
  980. lbValue y2 = lb_emit_struct_ev(p, rhs, 2);
  981. lbValue y3 = lb_emit_struct_ev(p, rhs, 3);
  982. if (immediate_type != ft) {
  983. x0 = lb_emit_conv(p, x0, immediate_type);
  984. x1 = lb_emit_conv(p, x1, immediate_type);
  985. x2 = lb_emit_conv(p, x2, immediate_type);
  986. x3 = lb_emit_conv(p, x3, immediate_type);
  987. y0 = lb_emit_conv(p, y0, immediate_type);
  988. y1 = lb_emit_conv(p, y1, immediate_type);
  989. y2 = lb_emit_conv(p, y2, immediate_type);
  990. y3 = lb_emit_conv(p, y3, immediate_type);
  991. }
  992. lbValue z0 = lb_emit_arith(p, op, x0, y0, immediate_type);
  993. lbValue z1 = lb_emit_arith(p, op, x1, y1, immediate_type);
  994. lbValue z2 = lb_emit_arith(p, op, x2, y2, immediate_type);
  995. lbValue z3 = lb_emit_arith(p, op, x3, y3, immediate_type);
  996. lbValue d0 = lb_emit_struct_ep(p, res.addr, 0);
  997. lbValue d1 = lb_emit_struct_ep(p, res.addr, 1);
  998. lbValue d2 = lb_emit_struct_ep(p, res.addr, 2);
  999. lbValue d3 = lb_emit_struct_ep(p, res.addr, 3);
  1000. if (immediate_type != ft) {
  1001. d0 = lb_emit_conv(p, d0, ft);
  1002. d1 = lb_emit_conv(p, d1, ft);
  1003. d2 = lb_emit_conv(p, d2, ft);
  1004. d3 = lb_emit_conv(p, d3, ft);
  1005. }
  1006. lb_emit_store(p, d0, z0);
  1007. lb_emit_store(p, d1, z1);
  1008. lb_emit_store(p, d2, z2);
  1009. lb_emit_store(p, d3, z3);
  1010. return lb_addr_load(p, res);
  1011. } else if (op == Token_Mul) {
  1012. TEMPORARY_ALLOCATOR_GUARD();
  1013. auto args = array_make<lbValue>(temporary_allocator(), 2);
  1014. args[0] = lhs;
  1015. args[1] = rhs;
  1016. switch (8*type_size_of(ft)) {
  1017. case 16: return lb_emit_runtime_call(p, "mul_quaternion64", args);
  1018. case 32: return lb_emit_runtime_call(p, "mul_quaternion128", args);
  1019. case 64: return lb_emit_runtime_call(p, "mul_quaternion256", args);
  1020. default: GB_PANIC("Unknown float type"); break;
  1021. }
  1022. } else if (op == Token_Quo) {
  1023. TEMPORARY_ALLOCATOR_GUARD();
  1024. auto args = array_make<lbValue>(temporary_allocator(), 2);
  1025. args[0] = lhs;
  1026. args[1] = rhs;
  1027. switch (8*type_size_of(ft)) {
  1028. case 16: return lb_emit_runtime_call(p, "quo_quaternion64", args);
  1029. case 32: return lb_emit_runtime_call(p, "quo_quaternion128", args);
  1030. case 64: return lb_emit_runtime_call(p, "quo_quaternion256", args);
  1031. default: GB_PANIC("Unknown float type"); break;
  1032. }
  1033. }
  1034. }
  1035. lhs = lb_emit_conv(p, lhs, type);
  1036. rhs = lb_emit_conv(p, rhs, type);
  1037. if (is_type_integer(type) && is_type_different_to_arch_endianness(type)) {
  1038. switch (op) {
  1039. case Token_AndNot:
  1040. case Token_And:
  1041. case Token_Or:
  1042. case Token_Xor:
  1043. goto handle_op;
  1044. }
  1045. Type *platform_type = integer_endian_type_to_platform_type(type);
  1046. lbValue x = lb_emit_byte_swap(p, lhs, integer_endian_type_to_platform_type(lhs.type));
  1047. lbValue y = lb_emit_byte_swap(p, rhs, integer_endian_type_to_platform_type(rhs.type));
  1048. lbValue res = lb_emit_arith(p, op, x, y, platform_type);
  1049. return lb_emit_byte_swap(p, res, type);
  1050. }
  1051. if (is_type_float(type) && is_type_different_to_arch_endianness(type)) {
  1052. Type *platform_type = integer_endian_type_to_platform_type(type);
  1053. lbValue x = lb_emit_conv(p, lhs, integer_endian_type_to_platform_type(lhs.type));
  1054. lbValue y = lb_emit_conv(p, rhs, integer_endian_type_to_platform_type(rhs.type));
  1055. lbValue res = lb_emit_arith(p, op, x, y, platform_type);
  1056. return lb_emit_byte_swap(p, res, type);
  1057. }
  1058. handle_op:;
  1059. lbValue res = {};
  1060. res.type = type;
  1061. // NOTE(bill): Bit Set Aliases for + and -
  1062. if (is_type_bit_set(type)) {
  1063. switch (op) {
  1064. case Token_Add: op = Token_Or; break;
  1065. case Token_Sub: op = Token_AndNot; break;
  1066. }
  1067. Type *u = bit_set_to_int(type);
  1068. if (is_type_array(u)) {
  1069. lhs.type = u;
  1070. rhs.type = u;
  1071. res = lb_emit_arith(p, op, lhs, rhs, u);
  1072. res.type = type;
  1073. return res;
  1074. }
  1075. }
  1076. Type *integral_type = type;
  1077. if (is_type_simd_vector(integral_type)) {
  1078. integral_type = core_array_type(integral_type);
  1079. }
  1080. switch (op) {
  1081. case Token_Add:
  1082. if (is_type_float(integral_type)) {
  1083. res.value = LLVMBuildFAdd(p->builder, lhs.value, rhs.value, "");
  1084. return res;
  1085. }
  1086. res.value = LLVMBuildAdd(p->builder, lhs.value, rhs.value, "");
  1087. return res;
  1088. case Token_Sub:
  1089. if (is_type_float(integral_type)) {
  1090. res.value = LLVMBuildFSub(p->builder, lhs.value, rhs.value, "");
  1091. return res;
  1092. }
  1093. res.value = LLVMBuildSub(p->builder, lhs.value, rhs.value, "");
  1094. return res;
  1095. case Token_Mul:
  1096. if (is_type_float(integral_type)) {
  1097. res.value = LLVMBuildFMul(p->builder, lhs.value, rhs.value, "");
  1098. return res;
  1099. }
  1100. res.value = LLVMBuildMul(p->builder, lhs.value, rhs.value, "");
  1101. return res;
  1102. case Token_Quo:
  1103. if (is_type_float(integral_type)) {
  1104. res.value = LLVMBuildFDiv(p->builder, lhs.value, rhs.value, "");
  1105. return res;
  1106. } else if (is_type_unsigned(integral_type)) {
  1107. res.value = LLVMBuildUDiv(p->builder, lhs.value, rhs.value, "");
  1108. return res;
  1109. }
  1110. res.value = LLVMBuildSDiv(p->builder, lhs.value, rhs.value, "");
  1111. return res;
  1112. case Token_Mod:
  1113. if (is_type_float(integral_type)) {
  1114. res.value = LLVMBuildFRem(p->builder, lhs.value, rhs.value, "");
  1115. return res;
  1116. } else if (is_type_unsigned(integral_type)) {
  1117. res.value = LLVMBuildURem(p->builder, lhs.value, rhs.value, "");
  1118. return res;
  1119. }
  1120. res.value = LLVMBuildSRem(p->builder, lhs.value, rhs.value, "");
  1121. return res;
  1122. case Token_ModMod:
  1123. if (is_type_unsigned(integral_type)) {
  1124. res.value = LLVMBuildURem(p->builder, lhs.value, rhs.value, "");
  1125. return res;
  1126. } else {
  1127. LLVMValueRef a = LLVMBuildSRem(p->builder, lhs.value, rhs.value, "");
  1128. LLVMValueRef b = LLVMBuildAdd(p->builder, a, rhs.value, "");
  1129. LLVMValueRef c = LLVMBuildSRem(p->builder, b, rhs.value, "");
  1130. res.value = c;
  1131. return res;
  1132. }
  1133. case Token_And:
  1134. res.value = LLVMBuildAnd(p->builder, lhs.value, rhs.value, "");
  1135. return res;
  1136. case Token_Or:
  1137. res.value = LLVMBuildOr(p->builder, lhs.value, rhs.value, "");
  1138. return res;
  1139. case Token_Xor:
  1140. res.value = LLVMBuildXor(p->builder, lhs.value, rhs.value, "");
  1141. return res;
  1142. case Token_Shl:
  1143. {
  1144. rhs = lb_emit_conv(p, rhs, lhs.type);
  1145. LLVMValueRef lhsval = lhs.value;
  1146. LLVMValueRef bits = rhs.value;
  1147. LLVMValueRef bit_size = LLVMConstInt(lb_type(p->module, rhs.type), 8*type_size_of(lhs.type), false);
  1148. LLVMValueRef width_test = LLVMBuildICmp(p->builder, LLVMIntULT, bits, bit_size, "");
  1149. res.value = LLVMBuildShl(p->builder, lhsval, bits, "");
  1150. LLVMValueRef zero = LLVMConstNull(lb_type(p->module, lhs.type));
  1151. res.value = LLVMBuildSelect(p->builder, width_test, res.value, zero, "");
  1152. return res;
  1153. }
  1154. case Token_Shr:
  1155. {
  1156. rhs = lb_emit_conv(p, rhs, lhs.type);
  1157. LLVMValueRef lhsval = lhs.value;
  1158. LLVMValueRef bits = rhs.value;
  1159. bool is_unsigned = is_type_unsigned(integral_type);
  1160. LLVMValueRef bit_size = LLVMConstInt(lb_type(p->module, rhs.type), 8*type_size_of(lhs.type), false);
  1161. LLVMValueRef width_test = LLVMBuildICmp(p->builder, LLVMIntULT, bits, bit_size, "");
  1162. if (is_unsigned) {
  1163. res.value = LLVMBuildLShr(p->builder, lhsval, bits, "");
  1164. } else {
  1165. res.value = LLVMBuildAShr(p->builder, lhsval, bits, "");
  1166. }
  1167. LLVMValueRef zero = LLVMConstNull(lb_type(p->module, lhs.type));
  1168. res.value = LLVMBuildSelect(p->builder, width_test, res.value, zero, "");
  1169. return res;
  1170. }
  1171. case Token_AndNot:
  1172. {
  1173. LLVMValueRef new_rhs = LLVMBuildNot(p->builder, rhs.value, "");
  1174. res.value = LLVMBuildAnd(p->builder, lhs.value, new_rhs, "");
  1175. return res;
  1176. }
  1177. break;
  1178. }
  1179. GB_PANIC("unhandled operator of lb_emit_arith");
  1180. return {};
  1181. }
  1182. gb_internal bool lb_is_empty_string_constant(Ast *expr) {
  1183. if (expr->tav.value.kind == ExactValue_String &&
  1184. is_type_string(expr->tav.type)) {
  1185. String s = expr->tav.value.value_string;
  1186. return s.len == 0;
  1187. }
  1188. return false;
  1189. }
  1190. gb_internal lbValue lb_build_binary_in(lbProcedure *p, lbValue left, lbValue right, TokenKind op) {
  1191. Type *rt = base_type(right.type);
  1192. if (is_type_pointer(rt)) {
  1193. right = lb_emit_load(p, right);
  1194. rt = base_type(type_deref(rt));
  1195. }
  1196. switch (rt->kind) {
  1197. case Type_Map:
  1198. {
  1199. lbValue map_ptr = lb_address_from_load_or_generate_local(p, right);
  1200. lbValue key = left;
  1201. lbValue ptr = lb_internal_dynamic_map_get_ptr(p, map_ptr, key);
  1202. if (op == Token_in) {
  1203. return lb_emit_conv(p, lb_emit_comp_against_nil(p, Token_NotEq, ptr), t_bool);
  1204. } else {
  1205. return lb_emit_conv(p, lb_emit_comp_against_nil(p, Token_CmpEq, ptr), t_bool);
  1206. }
  1207. }
  1208. break;
  1209. case Type_BitSet:
  1210. {
  1211. Type *key_type = rt->BitSet.elem;
  1212. GB_ASSERT(are_types_identical(left.type, key_type));
  1213. Type *it = bit_set_to_int(rt);
  1214. left = lb_emit_conv(p, left, it);
  1215. if (is_type_different_to_arch_endianness(it)) {
  1216. left = lb_emit_byte_swap(p, left, integer_endian_type_to_platform_type(it));
  1217. }
  1218. lbValue lower = lb_const_value(p->module, left.type, exact_value_i64(rt->BitSet.lower));
  1219. lbValue key = lb_emit_arith(p, Token_Sub, left, lower, left.type);
  1220. lbValue bit = lb_emit_arith(p, Token_Shl, lb_const_int(p->module, left.type, 1), key, left.type);
  1221. bit = lb_emit_conv(p, bit, it);
  1222. lbValue old_value = lb_emit_transmute(p, right, it);
  1223. lbValue new_value = lb_emit_arith(p, Token_And, old_value, bit, it);
  1224. if (op == Token_in) {
  1225. return lb_emit_conv(p, lb_emit_comp(p, Token_NotEq, new_value, lb_const_int(p->module, new_value.type, 0)), t_bool);
  1226. } else {
  1227. return lb_emit_conv(p, lb_emit_comp(p, Token_CmpEq, new_value, lb_const_int(p->module, new_value.type, 0)), t_bool);
  1228. }
  1229. }
  1230. break;
  1231. }
  1232. GB_PANIC("Invalid 'in' type");
  1233. return {};
  1234. }
  1235. gb_internal lbValue lb_build_binary_expr(lbProcedure *p, Ast *expr) {
  1236. ast_node(be, BinaryExpr, expr);
  1237. TypeAndValue tv = type_and_value_of_expr(expr);
  1238. if (is_type_matrix(be->left->tav.type) || is_type_matrix(be->right->tav.type)) {
  1239. lbValue left = lb_build_expr(p, be->left);
  1240. lbValue right = lb_build_expr(p, be->right);
  1241. return lb_emit_arith_matrix(p, be->op.kind, left, right, default_type(tv.type), false);
  1242. }
  1243. switch (be->op.kind) {
  1244. case Token_Add:
  1245. case Token_Sub:
  1246. case Token_Mul:
  1247. case Token_Quo:
  1248. case Token_Mod:
  1249. case Token_ModMod:
  1250. case Token_And:
  1251. case Token_Or:
  1252. case Token_Xor:
  1253. case Token_AndNot: {
  1254. Type *type = default_type(tv.type);
  1255. lbValue left = lb_build_expr(p, be->left);
  1256. lbValue right = lb_build_expr(p, be->right);
  1257. return lb_emit_arith(p, be->op.kind, left, right, type);
  1258. }
  1259. case Token_Shl:
  1260. case Token_Shr: {
  1261. lbValue left, right;
  1262. Type *type = default_type(tv.type);
  1263. left = lb_build_expr(p, be->left);
  1264. if (lb_is_expr_untyped_const(be->right)) {
  1265. // NOTE(bill): RHS shift operands can still be untyped
  1266. // Just bypass the standard lb_build_expr
  1267. right = lb_expr_untyped_const_to_typed(p->module, be->right, type);
  1268. } else {
  1269. right = lb_build_expr(p, be->right);
  1270. }
  1271. return lb_emit_arith(p, be->op.kind, left, right, type);
  1272. }
  1273. case Token_CmpEq:
  1274. case Token_NotEq:
  1275. if (is_type_untyped_nil(be->right->tav.type)) {
  1276. // `x == nil` or `x != nil`
  1277. lbValue left = lb_build_expr(p, be->left);
  1278. lbValue cmp = lb_emit_comp_against_nil(p, be->op.kind, left);
  1279. Type *type = default_type(tv.type);
  1280. return lb_emit_conv(p, cmp, type);
  1281. } else if (is_type_untyped_nil(be->left->tav.type)) {
  1282. // `nil == x` or `nil != x`
  1283. lbValue right = lb_build_expr(p, be->right);
  1284. lbValue cmp = lb_emit_comp_against_nil(p, be->op.kind, right);
  1285. Type *type = default_type(tv.type);
  1286. return lb_emit_conv(p, cmp, type);
  1287. } else if (lb_is_empty_string_constant(be->right)) {
  1288. // `x == ""` or `x != ""`
  1289. lbValue s = lb_build_expr(p, be->left);
  1290. s = lb_emit_conv(p, s, t_string);
  1291. lbValue len = lb_string_len(p, s);
  1292. lbValue cmp = lb_emit_comp(p, be->op.kind, len, lb_const_int(p->module, t_int, 0));
  1293. Type *type = default_type(tv.type);
  1294. return lb_emit_conv(p, cmp, type);
  1295. } else if (lb_is_empty_string_constant(be->left)) {
  1296. // `"" == x` or `"" != x`
  1297. lbValue s = lb_build_expr(p, be->right);
  1298. s = lb_emit_conv(p, s, t_string);
  1299. lbValue len = lb_string_len(p, s);
  1300. lbValue cmp = lb_emit_comp(p, be->op.kind, len, lb_const_int(p->module, t_int, 0));
  1301. Type *type = default_type(tv.type);
  1302. return lb_emit_conv(p, cmp, type);
  1303. }
  1304. /*fallthrough*/
  1305. case Token_Lt:
  1306. case Token_LtEq:
  1307. case Token_Gt:
  1308. case Token_GtEq:
  1309. {
  1310. lbValue left = {};
  1311. lbValue right = {};
  1312. if (be->left->tav.mode == Addressing_Type) {
  1313. left = lb_typeid(p->module, be->left->tav.type);
  1314. }
  1315. if (be->right->tav.mode == Addressing_Type) {
  1316. right = lb_typeid(p->module, be->right->tav.type);
  1317. }
  1318. if (left.value == nullptr) left = lb_build_expr(p, be->left);
  1319. if (right.value == nullptr) right = lb_build_expr(p, be->right);
  1320. lbValue cmp = lb_emit_comp(p, be->op.kind, left, right);
  1321. Type *type = default_type(tv.type);
  1322. return lb_emit_conv(p, cmp, type);
  1323. }
  1324. case Token_CmpAnd:
  1325. case Token_CmpOr:
  1326. return lb_emit_logical_binary_expr(p, be->op.kind, be->left, be->right, tv.type);
  1327. case Token_in:
  1328. case Token_not_in:
  1329. {
  1330. lbValue left = lb_build_expr(p, be->left);
  1331. lbValue right = lb_build_expr(p, be->right);
  1332. return lb_build_binary_in(p, left, right, be->op.kind);
  1333. }
  1334. default:
  1335. GB_PANIC("Invalid binary expression");
  1336. break;
  1337. }
  1338. return {};
  1339. }
  1340. gb_internal lbValue lb_emit_conv(lbProcedure *p, lbValue value, Type *t) {
  1341. lbModule *m = p->module;
  1342. t = reduce_tuple_to_single_type(t);
  1343. Type *src_type = value.type;
  1344. if (are_types_identical(t, src_type)) {
  1345. return value;
  1346. }
  1347. Type *src = core_type(src_type);
  1348. Type *dst = core_type(t);
  1349. GB_ASSERT(src != nullptr);
  1350. GB_ASSERT(dst != nullptr);
  1351. if (is_type_untyped_uninit(src)) {
  1352. return lb_const_undef(m, t);
  1353. }
  1354. if (is_type_untyped_nil(src)) {
  1355. return lb_const_nil(m, t);
  1356. }
  1357. if (LLVMIsConstant(value.value)) {
  1358. if (is_type_any(dst)) {
  1359. Type *st = default_type(src_type);
  1360. lbAddr default_value = lb_add_local_generated(p, st, false);
  1361. lb_addr_store(p, default_value, value);
  1362. lbValue data = lb_emit_conv(p, default_value.addr, t_rawptr);
  1363. lbValue id = lb_typeid(m, st);
  1364. lbAddr res = lb_add_local_generated(p, t, false);
  1365. lbValue a0 = lb_emit_struct_ep(p, res.addr, 0);
  1366. lbValue a1 = lb_emit_struct_ep(p, res.addr, 1);
  1367. lb_emit_store(p, a0, data);
  1368. lb_emit_store(p, a1, id);
  1369. return lb_addr_load(p, res);
  1370. } else if (dst->kind == Type_Basic) {
  1371. if (src->Basic.kind == Basic_string && dst->Basic.kind == Basic_cstring) {
  1372. String str = lb_get_const_string(m, value);
  1373. lbValue res = {};
  1374. res.type = t;
  1375. res.value = llvm_cstring(m, str);
  1376. return res;
  1377. }
  1378. // if (is_type_float(dst)) {
  1379. // return value;
  1380. // } else if (is_type_integer(dst)) {
  1381. // return value;
  1382. // }
  1383. // ExactValue ev = value->Constant.value;
  1384. // if (is_type_float(dst)) {
  1385. // ev = exact_value_to_float(ev);
  1386. // } else if (is_type_complex(dst)) {
  1387. // ev = exact_value_to_complex(ev);
  1388. // } else if (is_type_quaternion(dst)) {
  1389. // ev = exact_value_to_quaternion(ev);
  1390. // } else if (is_type_string(dst)) {
  1391. // // Handled elsewhere
  1392. // GB_ASSERT_MSG(ev.kind == ExactValue_String, "%d", ev.kind);
  1393. // } else if (is_type_integer(dst)) {
  1394. // ev = exact_value_to_integer(ev);
  1395. // } else if (is_type_pointer(dst)) {
// // IMPORTANT NOTE(bill): LLVM doesn't support pointer constants except 'null'
  1397. // lbValue i = lb_add_module_constant(p->module, t_uintptr, ev);
  1398. // return lb_emit(p, lb_instr_conv(p, irConv_inttoptr, i, t_uintptr, dst));
  1399. // }
  1400. // return lb_const_value(p->module, t, ev);
  1401. }
  1402. }
  1403. if (are_types_identical(src, dst)) {
  1404. if (!are_types_identical(src_type, t)) {
  1405. return lb_emit_transmute(p, value, t);
  1406. }
  1407. return value;
  1408. }
  1409. // bool <-> llvm bool
  1410. if (is_type_boolean(src) && dst == t_llvm_bool) {
  1411. lbValue res = {};
  1412. res.value = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(lb_type(m, src)), "");
  1413. res.type = t;
  1414. return res;
  1415. }
  1416. if (src == t_llvm_bool && is_type_boolean(dst)) {
  1417. lbValue res = {};
  1418. res.value = LLVMBuildZExt(p->builder, value.value, lb_type(m, dst), "");
  1419. res.type = t;
  1420. return res;
  1421. }
  1422. // integer -> integer
  1423. if (is_type_integer(src) && is_type_integer(dst)) {
  1424. GB_ASSERT(src->kind == Type_Basic &&
  1425. dst->kind == Type_Basic);
  1426. i64 sz = type_size_of(default_type(src));
  1427. i64 dz = type_size_of(default_type(dst));
  1428. if (sz == dz) {
  1429. if (dz > 1 && !types_have_same_internal_endian(src, dst)) {
  1430. return lb_emit_byte_swap(p, value, t);
  1431. }
  1432. lbValue res = {};
  1433. res.value = value.value;
  1434. res.type = t;
  1435. return res;
  1436. }
  1437. if (sz > 1 && is_type_different_to_arch_endianness(src)) {
  1438. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1439. value = lb_emit_byte_swap(p, value, platform_src_type);
  1440. }
  1441. LLVMOpcode op = LLVMTrunc;
  1442. if (dz < sz) {
  1443. op = LLVMTrunc;
  1444. } else if (dz == sz) {
// NOTE(bill): In LLVM, all integers are signed and rely upon 2's complement
  1446. // NOTE(bill): Copy the value just for type correctness
  1447. op = LLVMBitCast;
  1448. } else if (dz > sz) {
  1449. op = is_type_unsigned(src) ? LLVMZExt : LLVMSExt; // zero extent
  1450. }
  1451. if (dz > 1 && is_type_different_to_arch_endianness(dst)) {
  1452. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1453. lbValue res = {};
  1454. res.value = LLVMBuildCast(p->builder, op, value.value, lb_type(m, platform_dst_type), "");
  1455. res.type = t;
  1456. return lb_emit_byte_swap(p, res, t);
  1457. } else {
  1458. lbValue res = {};
  1459. res.value = LLVMBuildCast(p->builder, op, value.value, lb_type(m, t), "");
  1460. res.type = t;
  1461. return res;
  1462. }
  1463. }
  1464. // boolean -> boolean/integer
  1465. if (is_type_boolean(src) && (is_type_boolean(dst) || is_type_integer(dst))) {
  1466. LLVMValueRef b = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(lb_type(m, value.type)), "");
  1467. lbValue res = {};
  1468. res.value = LLVMBuildIntCast2(p->builder, b, lb_type(m, t), false, "");
  1469. res.type = t;
  1470. return res;
  1471. }
  1472. if (is_type_cstring(src) && is_type_u8_ptr(dst)) {
  1473. return lb_emit_transmute(p, value, dst);
  1474. }
  1475. if (is_type_u8_ptr(src) && is_type_cstring(dst)) {
  1476. return lb_emit_transmute(p, value, dst);
  1477. }
  1478. if (is_type_cstring(src) && is_type_u8_multi_ptr(dst)) {
  1479. return lb_emit_transmute(p, value, dst);
  1480. }
  1481. if (is_type_u8_multi_ptr(src) && is_type_cstring(dst)) {
  1482. return lb_emit_transmute(p, value, dst);
  1483. }
  1484. if (is_type_cstring(src) && is_type_rawptr(dst)) {
  1485. return lb_emit_transmute(p, value, dst);
  1486. }
  1487. if (is_type_rawptr(src) && is_type_cstring(dst)) {
  1488. return lb_emit_transmute(p, value, dst);
  1489. }
  1490. if (are_types_identical(src, t_cstring) && are_types_identical(dst, t_string)) {
  1491. TEMPORARY_ALLOCATOR_GUARD();
  1492. lbValue c = lb_emit_conv(p, value, t_cstring);
  1493. auto args = array_make<lbValue>(temporary_allocator(), 1);
  1494. args[0] = c;
  1495. lbValue s = lb_emit_runtime_call(p, "cstring_to_string", args);
  1496. return lb_emit_conv(p, s, dst);
  1497. }
  1498. // integer -> boolean
  1499. if (is_type_integer(src) && is_type_boolean(dst)) {
  1500. lbValue res = {};
  1501. res.value = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(lb_type(m, value.type)), "");
  1502. res.type = t_llvm_bool;
  1503. return lb_emit_conv(p, res, t);
  1504. }
  1505. // float -> float
  1506. if (is_type_float(src) && is_type_float(dst)) {
  1507. i64 sz = type_size_of(src);
  1508. i64 dz = type_size_of(dst);
  1509. if (dz == sz) {
  1510. if (types_have_same_internal_endian(src, dst)) {
  1511. lbValue res = {};
  1512. res.type = t;
  1513. res.value = value.value;
  1514. return res;
  1515. } else {
  1516. return lb_emit_byte_swap(p, value, t);
  1517. }
  1518. }
  1519. if (is_type_different_to_arch_endianness(src) || is_type_different_to_arch_endianness(dst)) {
  1520. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1521. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1522. lbValue res = {};
  1523. res = lb_emit_conv(p, value, platform_src_type);
  1524. res = lb_emit_conv(p, res, platform_dst_type);
  1525. if (is_type_different_to_arch_endianness(dst)) {
  1526. res = lb_emit_byte_swap(p, res, t);
  1527. }
  1528. return lb_emit_conv(p, res, t);
  1529. }
  1530. lbValue res = {};
  1531. res.type = t;
  1532. if (dz >= sz) {
  1533. res.value = LLVMBuildFPExt(p->builder, value.value, lb_type(m, t), "");
  1534. } else {
  1535. res.value = LLVMBuildFPTrunc(p->builder, value.value, lb_type(m, t), "");
  1536. }
  1537. return res;
  1538. }
  1539. if (is_type_complex(src) && is_type_complex(dst)) {
  1540. Type *ft = base_complex_elem_type(dst);
  1541. lbAddr gen = lb_add_local_generated(p, t, false);
  1542. lbValue gp = lb_addr_get_ptr(p, gen);
  1543. lbValue real = lb_emit_conv(p, lb_emit_struct_ev(p, value, 0), ft);
  1544. lbValue imag = lb_emit_conv(p, lb_emit_struct_ev(p, value, 1), ft);
  1545. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), real);
  1546. lb_emit_store(p, lb_emit_struct_ep(p, gp, 1), imag);
  1547. return lb_addr_load(p, gen);
  1548. }
  1549. if (is_type_quaternion(src) && is_type_quaternion(dst)) {
  1550. // @QuaternionLayout
  1551. Type *ft = base_complex_elem_type(dst);
  1552. lbAddr gen = lb_add_local_generated(p, t, false);
  1553. lbValue gp = lb_addr_get_ptr(p, gen);
  1554. lbValue q0 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 0), ft);
  1555. lbValue q1 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 1), ft);
  1556. lbValue q2 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 2), ft);
  1557. lbValue q3 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 3), ft);
  1558. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), q0);
  1559. lb_emit_store(p, lb_emit_struct_ep(p, gp, 1), q1);
  1560. lb_emit_store(p, lb_emit_struct_ep(p, gp, 2), q2);
  1561. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), q3);
  1562. return lb_addr_load(p, gen);
  1563. }
  1564. if (is_type_integer(src) && is_type_complex(dst)) {
  1565. Type *ft = base_complex_elem_type(dst);
  1566. lbAddr gen = lb_add_local_generated(p, t, true);
  1567. lbValue gp = lb_addr_get_ptr(p, gen);
  1568. lbValue real = lb_emit_conv(p, value, ft);
  1569. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), real);
  1570. return lb_addr_load(p, gen);
  1571. }
  1572. if (is_type_float(src) && is_type_complex(dst)) {
  1573. Type *ft = base_complex_elem_type(dst);
  1574. lbAddr gen = lb_add_local_generated(p, t, true);
  1575. lbValue gp = lb_addr_get_ptr(p, gen);
  1576. lbValue real = lb_emit_conv(p, value, ft);
  1577. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), real);
  1578. return lb_addr_load(p, gen);
  1579. }
  1580. if (is_type_integer(src) && is_type_quaternion(dst)) {
  1581. Type *ft = base_complex_elem_type(dst);
  1582. lbAddr gen = lb_add_local_generated(p, t, true);
  1583. lbValue gp = lb_addr_get_ptr(p, gen);
  1584. lbValue real = lb_emit_conv(p, value, ft);
  1585. // @QuaternionLayout
  1586. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), real);
  1587. return lb_addr_load(p, gen);
  1588. }
  1589. if (is_type_float(src) && is_type_quaternion(dst)) {
  1590. Type *ft = base_complex_elem_type(dst);
  1591. lbAddr gen = lb_add_local_generated(p, t, true);
  1592. lbValue gp = lb_addr_get_ptr(p, gen);
  1593. lbValue real = lb_emit_conv(p, value, ft);
  1594. // @QuaternionLayout
  1595. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), real);
  1596. return lb_addr_load(p, gen);
  1597. }
  1598. if (is_type_complex(src) && is_type_quaternion(dst)) {
  1599. Type *ft = base_complex_elem_type(dst);
  1600. lbAddr gen = lb_add_local_generated(p, t, true);
  1601. lbValue gp = lb_addr_get_ptr(p, gen);
  1602. lbValue real = lb_emit_conv(p, lb_emit_struct_ev(p, value, 0), ft);
  1603. lbValue imag = lb_emit_conv(p, lb_emit_struct_ev(p, value, 1), ft);
  1604. // @QuaternionLayout
  1605. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), real);
  1606. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), imag);
  1607. return lb_addr_load(p, gen);
  1608. }
  1609. // float <-> integer
  1610. if (is_type_float(src) && is_type_integer(dst)) {
  1611. if (is_type_different_to_arch_endianness(src) || is_type_different_to_arch_endianness(dst)) {
  1612. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1613. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1614. lbValue res = {};
  1615. res = lb_emit_conv(p, value, platform_src_type);
  1616. res = lb_emit_conv(p, res, platform_dst_type);
  1617. return lb_emit_conv(p, res, t);
  1618. }
  1619. if (is_type_integer_128bit(dst)) {
  1620. TEMPORARY_ALLOCATOR_GUARD();
  1621. auto args = array_make<lbValue>(temporary_allocator(), 1);
  1622. args[0] = value;
  1623. char const *call = "fixunsdfdi";
  1624. if (is_type_unsigned(dst)) {
  1625. call = "fixunsdfti";
  1626. }
  1627. lbValue res_i128 = lb_emit_runtime_call(p, call, args);
  1628. return lb_emit_conv(p, res_i128, t);
  1629. }
  1630. i64 sz = type_size_of(src);
  1631. lbValue res = {};
  1632. res.type = t;
  1633. if (is_type_unsigned(dst)) {
  1634. switch (sz) {
  1635. case 2:
  1636. case 4:
  1637. res.value = LLVMBuildFPToUI(p->builder, value.value, lb_type(m, t_u32), "");
  1638. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), false, "");
  1639. break;
  1640. case 8:
  1641. res.value = LLVMBuildFPToUI(p->builder, value.value, lb_type(m, t_u64), "");
  1642. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), false, "");
  1643. break;
  1644. default:
  1645. GB_PANIC("Unhandled float type");
  1646. break;
  1647. }
  1648. } else {
  1649. switch (sz) {
  1650. case 2:
  1651. case 4:
  1652. res.value = LLVMBuildFPToSI(p->builder, value.value, lb_type(m, t_i32), "");
  1653. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), true, "");
  1654. break;
  1655. case 8:
  1656. res.value = LLVMBuildFPToSI(p->builder, value.value, lb_type(m, t_i64), "");
  1657. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), true, "");
  1658. break;
  1659. default:
  1660. GB_PANIC("Unhandled float type");
  1661. break;
  1662. }
  1663. }
  1664. return res;
  1665. }
  1666. if (is_type_integer(src) && is_type_float(dst)) {
  1667. if (is_type_different_to_arch_endianness(src) || is_type_different_to_arch_endianness(dst)) {
  1668. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1669. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1670. lbValue res = {};
  1671. res = lb_emit_conv(p, value, platform_src_type);
  1672. res = lb_emit_conv(p, res, platform_dst_type);
  1673. if (is_type_different_to_arch_endianness(dst)) {
  1674. res = lb_emit_byte_swap(p, res, t);
  1675. }
  1676. return lb_emit_conv(p, res, t);
  1677. }
  1678. if (is_type_integer_128bit(src)) {
  1679. TEMPORARY_ALLOCATOR_GUARD();
  1680. auto args = array_make<lbValue>(temporary_allocator(), 1);
  1681. args[0] = value;
  1682. char const *call = "floattidf";
  1683. if (is_type_unsigned(src)) {
  1684. call = "floattidf_unsigned";
  1685. }
  1686. lbValue res_f64 = lb_emit_runtime_call(p, call, args);
  1687. return lb_emit_conv(p, res_f64, t);
  1688. }
  1689. lbValue res = {};
  1690. res.type = t;
  1691. if (is_type_unsigned(src)) {
  1692. res.value = LLVMBuildUIToFP(p->builder, value.value, lb_type(m, t), "");
  1693. } else {
  1694. res.value = LLVMBuildSIToFP(p->builder, value.value, lb_type(m, t), "");
  1695. }
  1696. return res;
  1697. }
  1698. if (is_type_simd_vector(dst)) {
  1699. Type *et = base_array_type(dst);
  1700. if (is_type_simd_vector(src)) {
  1701. Type *src_elem = core_array_type(src);
  1702. Type *dst_elem = core_array_type(dst);
  1703. GB_ASSERT(src->SimdVector.count == dst->SimdVector.count);
  1704. lbValue res = {};
  1705. res.type = t;
  1706. if (are_types_identical(src_elem, dst_elem)) {
  1707. res.value = value.value;
  1708. } else if (is_type_float(src_elem) && is_type_integer(dst_elem)) {
  1709. if (is_type_unsigned(dst_elem)) {
  1710. res.value = LLVMBuildFPToUI(p->builder, value.value, lb_type(m, t), "");
  1711. } else {
  1712. res.value = LLVMBuildFPToSI(p->builder, value.value, lb_type(m, t), "");
  1713. }
  1714. } else if (is_type_integer(src_elem) && is_type_float(dst_elem)) {
  1715. if (is_type_unsigned(src_elem)) {
  1716. res.value = LLVMBuildUIToFP(p->builder, value.value, lb_type(m, t), "");
  1717. } else {
  1718. res.value = LLVMBuildSIToFP(p->builder, value.value, lb_type(m, t), "");
  1719. }
  1720. } else if ((is_type_integer(src_elem) || is_type_boolean(src_elem)) && is_type_integer(dst_elem)) {
  1721. res.value = LLVMBuildIntCast2(p->builder, value.value, lb_type(m, t), !is_type_unsigned(src_elem), "");
  1722. } else if (is_type_float(src_elem) && is_type_float(dst_elem)) {
  1723. res.value = LLVMBuildFPCast(p->builder, value.value, lb_type(m, t), "");
  1724. } else if (is_type_integer(src_elem) && is_type_boolean(dst_elem)) {
  1725. LLVMValueRef i1vector = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(LLVMTypeOf(value.value)), "");
  1726. res.value = LLVMBuildIntCast2(p->builder, i1vector, lb_type(m, t), !is_type_unsigned(src_elem), "");
  1727. } else if (is_type_pointer(src_elem) && is_type_integer(dst_elem)) {
  1728. res.value = LLVMBuildPtrToInt(p->builder, value.value, lb_type(m, t), "");
  1729. } else if (is_type_integer(src_elem) && is_type_pointer(dst_elem)) {
  1730. res.value = LLVMBuildIntToPtr(p->builder, value.value, lb_type(m, t), "");
  1731. }else {
  1732. GB_PANIC("Unhandled simd vector conversion: %s -> %s", type_to_string(src), type_to_string(dst));
  1733. }
  1734. return res;
  1735. } else {
  1736. i64 count = get_array_type_count(dst);
  1737. LLVMTypeRef vt = lb_type(m, t);
  1738. LLVMTypeRef llvm_u32 = lb_type(m, t_u32);
  1739. LLVMValueRef elem = lb_emit_conv(p, value, et).value;
  1740. LLVMValueRef vector = LLVMConstNull(vt);
  1741. for (i64 i = 0; i < count; i++) {
  1742. LLVMValueRef idx = LLVMConstInt(llvm_u32, i, false);
  1743. vector = LLVMBuildInsertElement(p->builder, vector, elem, idx, "");
  1744. }
  1745. lbValue res = {};
  1746. res.type = t;
  1747. res.value = vector;
  1748. return res;
  1749. }
  1750. }
  1751. // bit_field <-> backing type
  1752. if (is_type_bit_field(src)) {
  1753. if (are_types_identical(src->BitField.backing_type, dst)) {
  1754. lbValue res = {};
  1755. res.type = t;
  1756. res.value = value.value;
  1757. return res;
  1758. }
  1759. }
  1760. if (is_type_bit_field(dst)) {
  1761. if (are_types_identical(src, dst->BitField.backing_type)) {
  1762. lbValue res = {};
  1763. res.type = t;
  1764. res.value = value.value;
  1765. return res;
  1766. }
  1767. }
  1768. // bit_set <-> backing type
  1769. if (is_type_bit_set(src)) {
  1770. Type *backing = bit_set_to_int(src);
  1771. if (are_types_identical(backing, dst)) {
  1772. lbValue res = {};
  1773. res.type = t;
  1774. res.value = value.value;
  1775. return res;
  1776. }
  1777. }
  1778. if (is_type_bit_set(dst)) {
  1779. Type *backing = bit_set_to_int(dst);
  1780. if (are_types_identical(src, backing)) {
  1781. lbValue res = {};
  1782. res.type = t;
  1783. res.value = value.value;
  1784. return res;
  1785. }
  1786. }
  1787. // Pointer <-> uintptr
  1788. if (is_type_pointer(src) && is_type_uintptr(dst)) {
  1789. lbValue res = {};
  1790. res.type = t;
  1791. res.value = LLVMBuildPtrToInt(p->builder, value.value, lb_type(m, t), "");
  1792. return res;
  1793. }
  1794. if (is_type_uintptr(src) && is_type_pointer(dst)) {
  1795. lbValue res = {};
  1796. res.type = t;
  1797. res.value = LLVMBuildIntToPtr(p->builder, value.value, lb_type(m, t), "");
  1798. return res;
  1799. }
  1800. if (is_type_multi_pointer(src) && is_type_uintptr(dst)) {
  1801. lbValue res = {};
  1802. res.type = t;
  1803. res.value = LLVMBuildPtrToInt(p->builder, value.value, lb_type(m, t), "");
  1804. return res;
  1805. }
  1806. if (is_type_uintptr(src) && is_type_multi_pointer(dst)) {
  1807. lbValue res = {};
  1808. res.type = t;
  1809. res.value = LLVMBuildIntToPtr(p->builder, value.value, lb_type(m, t), "");
  1810. return res;
  1811. }
  1812. if (is_type_union(dst)) {
  1813. if (dst->Union.variants.count == 1) {
  1814. Type *vt = dst->Union.variants[0];
  1815. if (internal_check_is_assignable_to(src_type, vt)) {
  1816. value = lb_emit_conv(p, value, vt);
  1817. lbAddr parent = lb_add_local_generated(p, t, true);
  1818. lb_emit_store_union_variant(p, parent.addr, value, vt);
  1819. return lb_addr_load(p, parent);
  1820. }
  1821. }
  1822. for (Type *vt : dst->Union.variants) {
  1823. if (are_types_identical(src_type, vt)) {
  1824. lbAddr parent = lb_add_local_generated(p, t, true);
  1825. lb_emit_store_union_variant(p, parent.addr, value, vt);
  1826. return lb_addr_load(p, parent);
  1827. }
  1828. }
  1829. ValidIndexAndScore *valids = gb_alloc_array(temporary_allocator(), ValidIndexAndScore, dst->Union.variants.count);
  1830. isize valid_count = 0;
  1831. isize first_success_index = -1;
  1832. for_array(i, dst->Union.variants) {
  1833. Type *vt = dst->Union.variants[i];
  1834. i64 score = 0;
  1835. if (internal_check_is_assignable_to(src_type, vt)) {
  1836. valids[valid_count].index = i;
  1837. valids[valid_count].score = score;
  1838. valid_count += 1;
  1839. if (first_success_index < 0) {
  1840. first_success_index = i;
  1841. }
  1842. }
  1843. }
  1844. if (valid_count > 1) {
  1845. gb_sort_array(valids, valid_count, valid_index_and_score_cmp);
  1846. i64 best_score = valids[0].score;
  1847. for (isize i = 1; i < valid_count; i++) {
  1848. auto v = valids[i];
  1849. if (best_score > v.score) {
  1850. valid_count = i;
  1851. break;
  1852. }
  1853. best_score = v.score;
  1854. }
  1855. first_success_index = valids[0].index;
  1856. }
  1857. if (valid_count == 1) {
  1858. Type *vt = dst->Union.variants[first_success_index];
  1859. value = lb_emit_conv(p, value, vt);
  1860. lbAddr parent = lb_add_local_generated(p, t, true);
  1861. lb_emit_store_union_variant(p, parent.addr, value, vt);
  1862. return lb_addr_load(p, parent);
  1863. }
  1864. }
  1865. // NOTE(bill): This has to be done before 'Pointer <-> Pointer' as it's
  1866. // subtype polymorphism casting
  1867. if (check_is_assignable_to_using_subtype(src_type, t)) {
  1868. Type *st = type_deref(src_type);
  1869. st = type_deref(st);
  1870. bool st_is_ptr = is_type_pointer(src_type);
  1871. st = base_type(st);
  1872. Type *dt = t;
  1873. GB_ASSERT(is_type_struct(st) || is_type_raw_union(st));
  1874. Selection sel = {};
  1875. sel.index.allocator = heap_allocator();
  1876. defer (array_free(&sel.index));
  1877. if (lookup_subtype_polymorphic_selection(t, src_type, &sel)) {
  1878. if (sel.entity == nullptr) {
  1879. GB_PANIC("invalid subtype cast %s -> ", type_to_string(src_type), type_to_string(t));
  1880. }
  1881. if (st_is_ptr) {
  1882. lbValue res = lb_emit_deep_field_gep(p, value, sel);
  1883. Type *rt = res.type;
  1884. if (!are_types_identical(rt, dt) && are_types_identical(type_deref(rt), dt)) {
  1885. res = lb_emit_load(p, res);
  1886. }
  1887. return res;
  1888. } else {
  1889. if (is_type_pointer(value.type)) {
  1890. Type *rt = value.type;
  1891. if (!are_types_identical(rt, dt) && are_types_identical(type_deref(rt), dt)) {
  1892. value = lb_emit_load(p, value);
  1893. } else {
  1894. value = lb_emit_deep_field_gep(p, value, sel);
  1895. return lb_emit_load(p, value);
  1896. }
  1897. }
  1898. return lb_emit_deep_field_ev(p, value, sel);
  1899. }
  1900. }
  1901. }
  1902. // Pointer <-> Pointer
  1903. if (is_type_pointer(src) && is_type_pointer(dst)) {
  1904. lbValue res = {};
  1905. res.type = t;
  1906. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1907. return res;
  1908. }
  1909. if (is_type_multi_pointer(src) && is_type_pointer(dst)) {
  1910. lbValue res = {};
  1911. res.type = t;
  1912. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1913. return res;
  1914. }
  1915. if (is_type_pointer(src) && is_type_multi_pointer(dst)) {
  1916. lbValue res = {};
  1917. res.type = t;
  1918. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1919. return res;
  1920. }
  1921. if (is_type_multi_pointer(src) && is_type_multi_pointer(dst)) {
  1922. lbValue res = {};
  1923. res.type = t;
  1924. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1925. return res;
  1926. }
  1927. // proc <-> proc
  1928. if (is_type_proc(src) && is_type_proc(dst)) {
  1929. lbValue res = {};
  1930. res.type = t;
  1931. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1932. return res;
  1933. }
  1934. // pointer -> proc
  1935. if (is_type_pointer(src) && is_type_proc(dst)) {
  1936. lbValue res = {};
  1937. res.type = t;
  1938. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1939. return res;
  1940. }
  1941. // proc -> pointer
  1942. if (is_type_proc(src) && is_type_pointer(dst)) {
  1943. lbValue res = {};
  1944. res.type = t;
  1945. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1946. return res;
  1947. }
  1948. // []byte/[]u8 <-> string
  1949. if (is_type_u8_slice(src) && is_type_string(dst)) {
  1950. return lb_emit_transmute(p, value, t);
  1951. }
  1952. if (is_type_string(src) && is_type_u8_slice(dst)) {
  1953. return lb_emit_transmute(p, value, t);
  1954. }
  1955. if (is_type_array_like(dst)) {
  1956. Type *elem = base_array_type(dst);
  1957. isize index_count = cast(isize)get_array_type_count(dst);
  1958. isize inlineable = type_size_of(dst) <= build_context.max_simd_align;
  1959. lbValue e = lb_emit_conv(p, value, elem);
  1960. if (inlineable && lb_is_const(e)) {
  1961. lbAddr v = {};
  1962. if (e.value) {
  1963. TEMPORARY_ALLOCATOR_GUARD();
  1964. LLVMValueRef *values = gb_alloc_array(temporary_allocator(), LLVMValueRef, index_count);
  1965. for (isize i = 0; i < index_count; i++) {
  1966. values[i] = e.value;
  1967. }
  1968. lbValue array_const_value = {};
  1969. array_const_value.type = t;
  1970. array_const_value.value = LLVMConstArray(lb_type(m, elem), values, cast(unsigned)index_count);
  1971. v = lb_add_global_generated(m, t, array_const_value);
  1972. } else {
  1973. v = lb_add_global_generated(m, t);
  1974. }
  1975. lb_make_global_private_const(v);
  1976. return lb_addr_load(p, v);
  1977. }
  1978. // NOTE(bill): Doesn't need to be zero because it will be initialized in the loops
  1979. lbAddr v = lb_add_local_generated(p, t, false);
  1980. if (!inlineable) {
  1981. auto loop_data = lb_loop_start(p, index_count, t_int);
  1982. lbValue elem = lb_emit_array_ep(p, v.addr, loop_data.idx);
  1983. lb_emit_store(p, elem, e);
  1984. lb_loop_end(p, loop_data);
  1985. } else {
  1986. for (isize i = 0; i < index_count; i++) {
  1987. lbValue elem = lb_emit_array_epi(p, v.addr, i);
  1988. lb_emit_store(p, elem, e);
  1989. }
  1990. }
  1991. return lb_addr_load(p, v);
  1992. }
  1993. if (is_type_matrix(dst) && !is_type_matrix(src)) {
  1994. GB_ASSERT_MSG(dst->Matrix.row_count == dst->Matrix.column_count, "%s <- %s", type_to_string(dst), type_to_string(src));
  1995. Type *elem = base_array_type(dst);
  1996. lbValue e = lb_emit_conv(p, value, elem);
  1997. lbAddr v = lb_add_local_generated(p, t, false);
  1998. lbValue zero = lb_const_value(p->module, elem, exact_value_i64(0), true);
  1999. for (i64 j = 0; j < dst->Matrix.column_count; j++) {
  2000. for (i64 i = 0; i < dst->Matrix.row_count; i++) {
  2001. lbValue ptr = lb_emit_matrix_epi(p, v.addr, i, j);
  2002. lb_emit_store(p, ptr, i == j ? e : zero);
  2003. }
  2004. }
  2005. return lb_addr_load(p, v);
  2006. }
  2007. if (is_type_matrix(dst) && is_type_matrix(src)) {
  2008. GB_ASSERT(dst->kind == Type_Matrix);
  2009. GB_ASSERT(src->kind == Type_Matrix);
  2010. lbAddr v = lb_add_local_generated(p, t, true);
  2011. if (is_matrix_square(dst) && is_matrix_square(dst)) {
  2012. for (i64 j = 0; j < dst->Matrix.column_count; j++) {
  2013. for (i64 i = 0; i < dst->Matrix.row_count; i++) {
  2014. if (i < src->Matrix.row_count && j < src->Matrix.column_count) {
  2015. lbValue d = lb_emit_matrix_epi(p, v.addr, i, j);
  2016. lbValue s = lb_emit_matrix_ev(p, value, i, j);
  2017. lb_emit_store(p, d, s);
  2018. } else if (i == j) {
  2019. lbValue d = lb_emit_matrix_epi(p, v.addr, i, j);
  2020. lbValue s = lb_const_value(p->module, dst->Matrix.elem, exact_value_i64(1), true);
  2021. lb_emit_store(p, d, s);
  2022. }
  2023. }
  2024. }
  2025. } else {
  2026. i64 dst_count = dst->Matrix.row_count*dst->Matrix.column_count;
  2027. i64 src_count = src->Matrix.row_count*src->Matrix.column_count;
  2028. GB_ASSERT(dst_count == src_count);
  2029. lbValue pdst = v.addr;
  2030. lbValue psrc = lb_address_from_load_or_generate_local(p, value);
  2031. bool same_elem_base_types = are_types_identical(
  2032. base_type(dst->Matrix.elem),
  2033. base_type(src->Matrix.elem)
  2034. );
  2035. if (same_elem_base_types && type_size_of(dst) == type_size_of(src)) {
  2036. lb_mem_copy_overlapping(p, v.addr, psrc, lb_const_int(p->module, t_int, type_size_of(dst)));
  2037. } else {
  2038. for (i64 i = 0; i < src_count; i++) {
  2039. lbValue dp = lb_emit_array_epi(p, v.addr, matrix_column_major_index_to_offset(dst, i));
  2040. lbValue sp = lb_emit_array_epi(p, psrc, matrix_column_major_index_to_offset(src, i));
  2041. lbValue s = lb_emit_load(p, sp);
  2042. s = lb_emit_conv(p, s, dst->Matrix.elem);
  2043. lb_emit_store(p, dp, s);
  2044. }
  2045. }
  2046. }
  2047. return lb_addr_load(p, v);
  2048. }
  2049. if (is_type_any(dst)) {
  2050. if (is_type_untyped_uninit(src)) {
  2051. return lb_const_undef(p->module, t);
  2052. }
  2053. if (is_type_untyped_nil(src)) {
  2054. return lb_const_nil(p->module, t);
  2055. }
  2056. lbAddr result = lb_add_local_generated(p, t, true);
  2057. Type *st = default_type(src_type);
  2058. lbValue data = lb_address_from_load_or_generate_local(p, value);
  2059. GB_ASSERT_MSG(is_type_pointer(data.type), "%s", type_to_string(data.type));
  2060. GB_ASSERT_MSG(is_type_typed(st), "%s", type_to_string(st));
  2061. data = lb_emit_conv(p, data, t_rawptr);
  2062. lbValue id = lb_typeid(p->module, st);
  2063. lbValue any_data = lb_emit_struct_ep(p, result.addr, 0);
  2064. lbValue any_id = lb_emit_struct_ep(p, result.addr, 1);
  2065. lb_emit_store(p, any_data, data);
  2066. lb_emit_store(p, any_id, id);
  2067. return lb_addr_load(p, result);
  2068. }
  2069. i64 src_sz = type_size_of(src);
  2070. i64 dst_sz = type_size_of(dst);
  2071. if (src_sz == dst_sz) {
  2072. // bit_set <-> integer
  2073. if (is_type_integer(src) && is_type_bit_set(dst)) {
  2074. lbValue res = lb_emit_conv(p, value, bit_set_to_int(dst));
  2075. res.type = t;
  2076. return res;
  2077. }
  2078. if (is_type_bit_set(src) && is_type_integer(dst)) {
  2079. lbValue bs = value;
  2080. bs.type = bit_set_to_int(src);
  2081. return lb_emit_conv(p, bs, dst);
  2082. }
  2083. // typeid <-> integer
  2084. if (is_type_integer(src) && is_type_typeid(dst)) {
  2085. return lb_emit_transmute(p, value, dst);
  2086. }
  2087. if (is_type_typeid(src) && is_type_integer(dst)) {
  2088. return lb_emit_transmute(p, value, dst);
  2089. }
  2090. }
  2091. if (is_type_untyped(src)) {
  2092. if (is_type_string(src) && is_type_string(dst)) {
  2093. lbAddr result = lb_add_local_generated(p, t, false);
  2094. lb_addr_store(p, result, value);
  2095. return lb_addr_load(p, result);
  2096. }
  2097. }
  2098. gb_printf_err("%.*s\n", LIT(p->name));
  2099. gb_printf_err("lb_emit_conv: src -> dst\n");
  2100. gb_printf_err("Not Identical %s != %s\n", type_to_string(src_type), type_to_string(t));
  2101. gb_printf_err("Not Identical %s != %s\n", type_to_string(src), type_to_string(dst));
  2102. gb_printf_err("Not Identical %p != %p\n", src_type, t);
  2103. gb_printf_err("Not Identical %p != %p\n", src, dst);
  2104. GB_PANIC("Invalid type conversion: '%s' to '%s' for procedure '%.*s'",
  2105. type_to_string(src_type), type_to_string(t),
  2106. LIT(p->name));
  2107. return {};
  2108. }
  2109. gb_internal lbValue lb_emit_c_vararg(lbProcedure *p, lbValue arg, Type *type) {
  2110. Type *core = core_type(type);
  2111. if (core->kind == Type_BitSet) {
  2112. core = core_type(bit_set_to_int(core));
  2113. arg = lb_emit_transmute(p, arg, core);
  2114. }
  2115. Type *promoted = c_vararg_promote_type(core);
  2116. return lb_emit_conv(p, arg, promoted);
  2117. }
  2118. gb_internal lbValue lb_compare_records(lbProcedure *p, TokenKind op_kind, lbValue left, lbValue right, Type *type) {
  2119. GB_ASSERT((is_type_struct(type) || is_type_union(type)) && is_type_comparable(type));
  2120. lbValue left_ptr = lb_address_from_load_or_generate_local(p, left);
  2121. lbValue right_ptr = lb_address_from_load_or_generate_local(p, right);
  2122. lbValue res = {};
  2123. if (type_size_of(type) == 0) {
  2124. switch (op_kind) {
  2125. case Token_CmpEq:
  2126. return lb_const_bool(p->module, t_bool, true);
  2127. case Token_NotEq:
  2128. return lb_const_bool(p->module, t_bool, false);
  2129. }
  2130. GB_PANIC("invalid operator");
  2131. }
  2132. TEMPORARY_ALLOCATOR_GUARD();
  2133. if (is_type_simple_compare(type)) {
  2134. // TODO(bill): Test to see if this is actually faster!!!!
  2135. auto args = array_make<lbValue>(temporary_allocator(), 3);
  2136. args[0] = lb_emit_conv(p, left_ptr, t_rawptr);
  2137. args[1] = lb_emit_conv(p, right_ptr, t_rawptr);
  2138. args[2] = lb_const_int(p->module, t_int, type_size_of(type));
  2139. res = lb_emit_runtime_call(p, "memory_equal", args);
  2140. } else {
  2141. lbValue value = lb_equal_proc_for_type(p->module, type);
  2142. auto args = array_make<lbValue>(temporary_allocator(), 2);
  2143. args[0] = lb_emit_conv(p, left_ptr, t_rawptr);
  2144. args[1] = lb_emit_conv(p, right_ptr, t_rawptr);
  2145. res = lb_emit_call(p, value, args);
  2146. }
  2147. if (op_kind == Token_NotEq) {
  2148. res = lb_emit_unary_arith(p, Token_Not, res, res.type);
  2149. }
  2150. return res;
  2151. }
  2152. gb_internal lbValue lb_emit_comp(lbProcedure *p, TokenKind op_kind, lbValue left, lbValue right) {
  2153. Type *a = core_type(left.type);
  2154. Type *b = core_type(right.type);
  2155. GB_ASSERT(gb_is_between(op_kind, Token__ComparisonBegin+1, Token__ComparisonEnd-1));
  2156. lbValue nil_check = {};
  2157. if (is_type_array_like(left.type) || is_type_array_like(right.type)) {
  2158. // don't do `nil` check if it is array-like
  2159. } else if (is_type_untyped_nil(left.type)) {
  2160. nil_check = lb_emit_comp_against_nil(p, op_kind, right);
  2161. } else if (is_type_untyped_nil(right.type)) {
  2162. nil_check = lb_emit_comp_against_nil(p, op_kind, left);
  2163. }
  2164. if (nil_check.value != nullptr) {
  2165. return nil_check;
  2166. }
  2167. if (are_types_identical(a, b)) {
  2168. // NOTE(bill): No need for a conversion
  2169. } else if (lb_is_const(left) || lb_is_const_nil(left)) {
  2170. if (lb_is_const_nil(left)) {
  2171. return lb_emit_comp_against_nil(p, op_kind, right);
  2172. }
  2173. left = lb_emit_conv(p, left, right.type);
  2174. } else if (lb_is_const(right) || lb_is_const_nil(right)) {
  2175. if (lb_is_const_nil(right)) {
  2176. return lb_emit_comp_against_nil(p, op_kind, left);
  2177. }
  2178. right = lb_emit_conv(p, right, left.type);
  2179. } else {
  2180. Type *lt = left.type;
  2181. Type *rt = right.type;
  2182. lt = left.type;
  2183. rt = right.type;
  2184. i64 ls = type_size_of(lt);
  2185. i64 rs = type_size_of(rt);
  2186. // NOTE(bill): Quick heuristic, larger types are usually the target type
  2187. if (ls < rs) {
  2188. left = lb_emit_conv(p, left, rt);
  2189. } else if (ls > rs) {
  2190. right = lb_emit_conv(p, right, lt);
  2191. } else {
  2192. if (is_type_union(rt)) {
  2193. left = lb_emit_conv(p, left, rt);
  2194. } else {
  2195. right = lb_emit_conv(p, right, lt);
  2196. }
  2197. }
  2198. }
  2199. a = core_type(left.type);
  2200. b = core_type(right.type);
  2201. if (is_type_matrix(a) && (op_kind == Token_CmpEq || op_kind == Token_NotEq)) {
  2202. Type *tl = base_type(a);
  2203. lbValue lhs = lb_address_from_load_or_generate_local(p, left);
  2204. lbValue rhs = lb_address_from_load_or_generate_local(p, right);
  2205. // TODO(bill): Test to see if this is actually faster!!!!
  2206. auto args = array_make<lbValue>(permanent_allocator(), 3);
  2207. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2208. args[1] = lb_emit_conv(p, rhs, t_rawptr);
  2209. args[2] = lb_const_int(p->module, t_int, type_size_of(tl));
  2210. lbValue val = lb_emit_runtime_call(p, "memory_compare", args);
  2211. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_nil(p->module, val.type));
  2212. return lb_emit_conv(p, res, t_bool);
  2213. }
  2214. if (is_type_array_like(a)) {
  2215. Type *tl = base_type(a);
  2216. lbValue lhs = lb_address_from_load_or_generate_local(p, left);
  2217. lbValue rhs = lb_address_from_load_or_generate_local(p, right);
  2218. TokenKind cmp_op = Token_And;
  2219. lbValue res = lb_const_bool(p->module, t_llvm_bool, true);
  2220. if (op_kind == Token_NotEq) {
  2221. res = lb_const_bool(p->module, t_llvm_bool, false);
  2222. cmp_op = Token_Or;
  2223. } else if (op_kind == Token_CmpEq) {
  2224. res = lb_const_bool(p->module, t_llvm_bool, true);
  2225. cmp_op = Token_And;
  2226. }
  2227. bool inline_array_arith = lb_can_try_to_inline_array_arith(tl);
  2228. i32 count = 0;
  2229. switch (tl->kind) {
  2230. case Type_Array: count = cast(i32)tl->Array.count; break;
  2231. case Type_EnumeratedArray: count = cast(i32)tl->EnumeratedArray.count; break;
  2232. }
  2233. if (inline_array_arith) {
  2234. // inline
  2235. lbAddr val = lb_add_local_generated(p, t_bool, false);
  2236. lb_addr_store(p, val, res);
  2237. for (i32 i = 0; i < count; i++) {
  2238. lbValue x = lb_emit_load(p, lb_emit_array_epi(p, lhs, i));
  2239. lbValue y = lb_emit_load(p, lb_emit_array_epi(p, rhs, i));
  2240. lbValue cmp = lb_emit_comp(p, op_kind, x, y);
  2241. lbValue new_res = lb_emit_arith(p, cmp_op, lb_addr_load(p, val), cmp, t_bool);
  2242. lb_addr_store(p, val, lb_emit_conv(p, new_res, t_bool));
  2243. }
  2244. return lb_addr_load(p, val);
  2245. } else {
  2246. if (is_type_simple_compare(tl) && (op_kind == Token_CmpEq || op_kind == Token_NotEq)) {
  2247. // TODO(bill): Test to see if this is actually faster!!!!
  2248. auto args = array_make<lbValue>(permanent_allocator(), 3);
  2249. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2250. args[1] = lb_emit_conv(p, rhs, t_rawptr);
  2251. args[2] = lb_const_int(p->module, t_int, type_size_of(tl));
  2252. lbValue val = lb_emit_runtime_call(p, "memory_compare", args);
  2253. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_nil(p->module, val.type));
  2254. return lb_emit_conv(p, res, t_bool);
  2255. } else {
  2256. lbAddr val = lb_add_local_generated(p, t_bool, false);
  2257. lb_addr_store(p, val, res);
  2258. auto loop_data = lb_loop_start(p, count, t_i32);
  2259. {
  2260. lbValue i = loop_data.idx;
  2261. lbValue x = lb_emit_load(p, lb_emit_array_ep(p, lhs, i));
  2262. lbValue y = lb_emit_load(p, lb_emit_array_ep(p, rhs, i));
  2263. lbValue cmp = lb_emit_comp(p, op_kind, x, y);
  2264. lbValue new_res = lb_emit_arith(p, cmp_op, lb_addr_load(p, val), cmp, t_bool);
  2265. lb_addr_store(p, val, lb_emit_conv(p, new_res, t_bool));
  2266. }
  2267. lb_loop_end(p, loop_data);
  2268. return lb_addr_load(p, val);
  2269. }
  2270. }
  2271. }
  2272. if ((is_type_struct(a) || is_type_union(a)) && is_type_comparable(a)) {
  2273. return lb_compare_records(p, op_kind, left, right, a);
  2274. }
  2275. if ((is_type_struct(b) || is_type_union(b)) && is_type_comparable(b)) {
  2276. return lb_compare_records(p, op_kind, left, right, b);
  2277. }
  2278. if (is_type_string(a)) {
  2279. if (is_type_cstring(a) && is_type_cstring(b)) {
  2280. left = lb_emit_conv(p, left, t_cstring);
  2281. right = lb_emit_conv(p, right, t_cstring);
  2282. char const *runtime_procedure = nullptr;
  2283. switch (op_kind) {
  2284. case Token_CmpEq: runtime_procedure = "cstring_eq"; break;
  2285. case Token_NotEq: runtime_procedure = "cstring_ne"; break;
  2286. case Token_Lt: runtime_procedure = "cstring_lt"; break;
  2287. case Token_Gt: runtime_procedure = "cstring_gt"; break;
  2288. case Token_LtEq: runtime_procedure = "cstring_le"; break;
  2289. case Token_GtEq: runtime_procedure = "cstring_ge"; break;
  2290. }
  2291. GB_ASSERT(runtime_procedure != nullptr);
  2292. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2293. args[0] = left;
  2294. args[1] = right;
  2295. return lb_emit_runtime_call(p, runtime_procedure, args);
  2296. }
  2297. if (is_type_cstring(a) ^ is_type_cstring(b)) {
  2298. left = lb_emit_conv(p, left, t_string);
  2299. right = lb_emit_conv(p, right, t_string);
  2300. }
  2301. char const *runtime_procedure = nullptr;
  2302. switch (op_kind) {
  2303. case Token_CmpEq: runtime_procedure = "string_eq"; break;
  2304. case Token_NotEq: runtime_procedure = "string_ne"; break;
  2305. case Token_Lt: runtime_procedure = "string_lt"; break;
  2306. case Token_Gt: runtime_procedure = "string_gt"; break;
  2307. case Token_LtEq: runtime_procedure = "string_le"; break;
  2308. case Token_GtEq: runtime_procedure = "string_ge"; break;
  2309. }
  2310. GB_ASSERT(runtime_procedure != nullptr);
  2311. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2312. args[0] = left;
  2313. args[1] = right;
  2314. return lb_emit_runtime_call(p, runtime_procedure, args);
  2315. }
  2316. if (is_type_complex(a)) {
  2317. char const *runtime_procedure = "";
  2318. i64 sz = 8*type_size_of(a);
  2319. switch (sz) {
  2320. case 32:
  2321. switch (op_kind) {
  2322. case Token_CmpEq: runtime_procedure = "complex32_eq"; break;
  2323. case Token_NotEq: runtime_procedure = "complex32_ne"; break;
  2324. }
  2325. break;
  2326. case 64:
  2327. switch (op_kind) {
  2328. case Token_CmpEq: runtime_procedure = "complex64_eq"; break;
  2329. case Token_NotEq: runtime_procedure = "complex64_ne"; break;
  2330. }
  2331. break;
  2332. case 128:
  2333. switch (op_kind) {
  2334. case Token_CmpEq: runtime_procedure = "complex128_eq"; break;
  2335. case Token_NotEq: runtime_procedure = "complex128_ne"; break;
  2336. }
  2337. break;
  2338. }
  2339. GB_ASSERT(runtime_procedure != nullptr);
  2340. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2341. args[0] = left;
  2342. args[1] = right;
  2343. return lb_emit_runtime_call(p, runtime_procedure, args);
  2344. }
  2345. if (is_type_quaternion(a)) {
  2346. char const *runtime_procedure = "";
  2347. i64 sz = 8*type_size_of(a);
  2348. switch (sz) {
  2349. case 64:
  2350. switch (op_kind) {
  2351. case Token_CmpEq: runtime_procedure = "quaternion64_eq"; break;
  2352. case Token_NotEq: runtime_procedure = "quaternion64_ne"; break;
  2353. }
  2354. break;
  2355. case 128:
  2356. switch (op_kind) {
  2357. case Token_CmpEq: runtime_procedure = "quaternion128_eq"; break;
  2358. case Token_NotEq: runtime_procedure = "quaternion128_ne"; break;
  2359. }
  2360. break;
  2361. case 256:
  2362. switch (op_kind) {
  2363. case Token_CmpEq: runtime_procedure = "quaternion256_eq"; break;
  2364. case Token_NotEq: runtime_procedure = "quaternion256_ne"; break;
  2365. }
  2366. break;
  2367. }
  2368. GB_ASSERT(runtime_procedure != nullptr);
  2369. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2370. args[0] = left;
  2371. args[1] = right;
  2372. return lb_emit_runtime_call(p, runtime_procedure, args);
  2373. }
  2374. if (is_type_bit_set(a)) {
  2375. switch (op_kind) {
  2376. case Token_Lt:
  2377. case Token_LtEq:
  2378. case Token_Gt:
  2379. case Token_GtEq:
  2380. {
  2381. Type *it = bit_set_to_int(a);
  2382. lbValue lhs = lb_emit_transmute(p, left, it);
  2383. lbValue rhs = lb_emit_transmute(p, right, it);
  2384. lbValue res = lb_emit_arith(p, Token_And, lhs, rhs, it);
  2385. if (op_kind == Token_Lt || op_kind == Token_LtEq) {
  2386. // (lhs & rhs) == lhs
  2387. res.value = LLVMBuildICmp(p->builder, LLVMIntEQ, res.value, lhs.value, "");
  2388. res.type = t_llvm_bool;
  2389. } else if (op_kind == Token_Gt || op_kind == Token_GtEq) {
  2390. // (lhs & rhs) == rhs
  2391. res.value = LLVMBuildICmp(p->builder, LLVMIntEQ, res.value, rhs.value, "");
  2392. res.type = t_llvm_bool;
  2393. }
  2394. // NOTE(bill): Strict subsets
  2395. if (op_kind == Token_Lt || op_kind == Token_Gt) {
  2396. // res &~ (lhs == rhs)
  2397. lbValue eq = {};
  2398. eq.value = LLVMBuildICmp(p->builder, LLVMIntEQ, lhs.value, rhs.value, "");
  2399. eq.type = t_llvm_bool;
  2400. res = lb_emit_arith(p, Token_AndNot, res, eq, t_llvm_bool);
  2401. }
  2402. return res;
  2403. }
  2404. case Token_CmpEq:
  2405. case Token_NotEq:
  2406. {
  2407. LLVMIntPredicate pred = {};
  2408. switch (op_kind) {
  2409. case Token_CmpEq: pred = LLVMIntEQ; break;
  2410. case Token_NotEq: pred = LLVMIntNE; break;
  2411. }
  2412. lbValue res = {};
  2413. res.type = t_llvm_bool;
  2414. res.value = LLVMBuildICmp(p->builder, pred, left.value, right.value, "");
  2415. return res;
  2416. }
  2417. }
  2418. }
  2419. if (op_kind != Token_CmpEq && op_kind != Token_NotEq) {
  2420. Type *t = left.type;
  2421. if (is_type_integer(t) && is_type_different_to_arch_endianness(t)) {
  2422. Type *platform_type = integer_endian_type_to_platform_type(t);
  2423. lbValue x = lb_emit_byte_swap(p, left, platform_type);
  2424. lbValue y = lb_emit_byte_swap(p, right, platform_type);
  2425. left = x;
  2426. right = y;
  2427. } else if (is_type_float(t) && is_type_different_to_arch_endianness(t)) {
  2428. Type *platform_type = integer_endian_type_to_platform_type(t);
  2429. lbValue x = lb_emit_conv(p, left, platform_type);
  2430. lbValue y = lb_emit_conv(p, right, platform_type);
  2431. left = x;
  2432. right = y;
  2433. }
  2434. }
  2435. a = core_type(left.type);
  2436. b = core_type(right.type);
  2437. lbValue res = {};
  2438. res.type = t_llvm_bool;
  2439. if (is_type_integer(a) ||
  2440. is_type_boolean(a) ||
  2441. is_type_pointer(a) ||
  2442. is_type_multi_pointer(a) ||
  2443. is_type_proc(a) ||
  2444. is_type_enum(a)) {
  2445. LLVMIntPredicate pred = {};
  2446. if (is_type_unsigned(left.type)) {
  2447. switch (op_kind) {
  2448. case Token_Gt: pred = LLVMIntUGT; break;
  2449. case Token_GtEq: pred = LLVMIntUGE; break;
  2450. case Token_Lt: pred = LLVMIntULT; break;
  2451. case Token_LtEq: pred = LLVMIntULE; break;
  2452. }
  2453. } else {
  2454. switch (op_kind) {
  2455. case Token_Gt: pred = LLVMIntSGT; break;
  2456. case Token_GtEq: pred = LLVMIntSGE; break;
  2457. case Token_Lt: pred = LLVMIntSLT; break;
  2458. case Token_LtEq: pred = LLVMIntSLE; break;
  2459. }
  2460. }
  2461. switch (op_kind) {
  2462. case Token_CmpEq: pred = LLVMIntEQ; break;
  2463. case Token_NotEq: pred = LLVMIntNE; break;
  2464. }
  2465. LLVMValueRef lhs = left.value;
  2466. LLVMValueRef rhs = right.value;
  2467. if (LLVMTypeOf(lhs) != LLVMTypeOf(rhs)) {
  2468. if (lb_is_type_kind(LLVMTypeOf(lhs), LLVMPointerTypeKind)) {
  2469. rhs = LLVMBuildPointerCast(p->builder, rhs, LLVMTypeOf(lhs), "");
  2470. }
  2471. }
  2472. res.value = LLVMBuildICmp(p->builder, pred, lhs, rhs, "");
  2473. } else if (is_type_float(a)) {
  2474. LLVMRealPredicate pred = {};
  2475. switch (op_kind) {
  2476. case Token_CmpEq: pred = LLVMRealOEQ; break;
  2477. case Token_Gt: pred = LLVMRealOGT; break;
  2478. case Token_GtEq: pred = LLVMRealOGE; break;
  2479. case Token_Lt: pred = LLVMRealOLT; break;
  2480. case Token_LtEq: pred = LLVMRealOLE; break;
  2481. case Token_NotEq: pred = LLVMRealONE; break;
  2482. }
  2483. res.value = LLVMBuildFCmp(p->builder, pred, left.value, right.value, "");
  2484. } else if (is_type_typeid(a)) {
  2485. LLVMIntPredicate pred = {};
  2486. switch (op_kind) {
  2487. case Token_Gt: pred = LLVMIntUGT; break;
  2488. case Token_GtEq: pred = LLVMIntUGE; break;
  2489. case Token_Lt: pred = LLVMIntULT; break;
  2490. case Token_LtEq: pred = LLVMIntULE; break;
  2491. case Token_CmpEq: pred = LLVMIntEQ; break;
  2492. case Token_NotEq: pred = LLVMIntNE; break;
  2493. }
  2494. res.value = LLVMBuildICmp(p->builder, pred, left.value, right.value, "");
  2495. } else if (is_type_simd_vector(a)) {
  2496. LLVMValueRef mask = nullptr;
  2497. Type *elem = base_array_type(a);
  2498. if (is_type_float(elem)) {
  2499. LLVMRealPredicate pred = {};
  2500. switch (op_kind) {
  2501. case Token_CmpEq: pred = LLVMRealOEQ; break;
  2502. case Token_NotEq: pred = LLVMRealONE; break;
  2503. }
  2504. mask = LLVMBuildFCmp(p->builder, pred, left.value, right.value, "");
  2505. } else {
  2506. LLVMIntPredicate pred = {};
  2507. switch (op_kind) {
  2508. case Token_CmpEq: pred = LLVMIntEQ; break;
  2509. case Token_NotEq: pred = LLVMIntNE; break;
  2510. }
  2511. mask = LLVMBuildICmp(p->builder, pred, left.value, right.value, "");
  2512. }
  2513. GB_ASSERT_MSG(mask != nullptr, "Unhandled comparison kind %s (%s) %.*s %s (%s)", type_to_string(left.type), type_to_string(base_type(left.type)), LIT(token_strings[op_kind]), type_to_string(right.type), type_to_string(base_type(right.type)));
  2514. /* NOTE(bill, 2022-05-28):
  2515. Thanks to Per Vognsen, sign extending <N x i1> to
  2516. a vector of the same width as the input vector, bit casting to an integer,
  2517. and then comparing against zero is the better option
  2518. See: https://lists.llvm.org/pipermail/llvm-dev/2012-September/053046.html
  2519. // Example assuming 128-bit vector
  2520. %1 = <4 x float> ...
  2521. %2 = <4 x float> ...
  2522. %3 = fcmp oeq <4 x float> %1, %2
  2523. %4 = sext <4 x i1> %3 to <4 x i32>
  2524. %5 = bitcast <4 x i32> %4 to i128
  2525. %6 = icmp ne i128 %5, 0
  2526. br i1 %6, label %true1, label %false2
  2527. This will result in 1 cmpps + 1 ptest + 1 br
  2528. (even without SSE4.1, contrary to what the mail list states, because of pmovmskb)
  2529. */
  2530. unsigned count = cast(unsigned)get_array_type_count(a);
  2531. unsigned elem_sz = cast(unsigned)(type_size_of(elem)*8);
  2532. LLVMTypeRef mask_type = LLVMVectorType(LLVMIntTypeInContext(p->module->ctx, elem_sz), count);
  2533. mask = LLVMBuildSExtOrBitCast(p->builder, mask, mask_type, "");
  2534. LLVMTypeRef mask_int_type = LLVMIntTypeInContext(p->module->ctx, cast(unsigned)(8*type_size_of(a)));
  2535. LLVMValueRef mask_int = LLVMBuildBitCast(p->builder, mask, mask_int_type, "");
  2536. res.value = LLVMBuildICmp(p->builder, LLVMIntNE, mask_int, LLVMConstNull(LLVMTypeOf(mask_int)), "");
  2537. return res;
  2538. } else {
  2539. GB_PANIC("Unhandled comparison kind %s (%s) %.*s %s (%s)", type_to_string(left.type), type_to_string(base_type(left.type)), LIT(token_strings[op_kind]), type_to_string(right.type), type_to_string(base_type(right.type)));
  2540. }
  2541. return res;
  2542. }
  2543. gb_internal lbValue lb_emit_comp_against_nil(lbProcedure *p, TokenKind op_kind, lbValue x) {
  2544. lbValue res = {};
  2545. res.type = t_llvm_bool;
  2546. Type *t = x.type;
  2547. Type *bt = base_type(t);
  2548. TypeKind type_kind = bt->kind;
  2549. switch (type_kind) {
  2550. case Type_Basic:
  2551. switch (bt->Basic.kind) {
  2552. case Basic_rawptr:
  2553. case Basic_cstring:
  2554. if (op_kind == Token_CmpEq) {
  2555. res.value = LLVMBuildIsNull(p->builder, x.value, "");
  2556. } else if (op_kind == Token_NotEq) {
  2557. res.value = LLVMBuildIsNotNull(p->builder, x.value, "");
  2558. }
  2559. return res;
  2560. case Basic_any:
  2561. {
  2562. // TODO(bill): is this correct behaviour for nil comparison for any?
  2563. lbValue data = lb_emit_struct_ev(p, x, 0);
  2564. lbValue ti = lb_emit_struct_ev(p, x, 1);
  2565. if (op_kind == Token_CmpEq) {
  2566. LLVMValueRef a = LLVMBuildIsNull(p->builder, data.value, "");
  2567. LLVMValueRef b = LLVMBuildIsNull(p->builder, ti.value, "");
  2568. res.value = LLVMBuildOr(p->builder, a, b, "");
  2569. return res;
  2570. } else if (op_kind == Token_NotEq) {
  2571. LLVMValueRef a = LLVMBuildIsNotNull(p->builder, data.value, "");
  2572. LLVMValueRef b = LLVMBuildIsNotNull(p->builder, ti.value, "");
  2573. res.value = LLVMBuildAnd(p->builder, a, b, "");
  2574. return res;
  2575. }
  2576. }
  2577. break;
  2578. case Basic_typeid:
  2579. lbValue invalid_typeid = lb_const_value(p->module, t_typeid, exact_value_i64(0));
  2580. return lb_emit_comp(p, op_kind, x, invalid_typeid);
  2581. }
  2582. break;
  2583. case Type_Enum:
  2584. case Type_Pointer:
  2585. case Type_MultiPointer:
  2586. case Type_Proc:
  2587. if (op_kind == Token_CmpEq) {
  2588. res.value = LLVMBuildIsNull(p->builder, x.value, "");
  2589. } else if (op_kind == Token_NotEq) {
  2590. res.value = LLVMBuildIsNotNull(p->builder, x.value, "");
  2591. }
  2592. return res;
  2593. case Type_BitSet:
  2594. {
  2595. Type *u = bit_set_to_int(bt);
  2596. if (is_type_array(u)) {
  2597. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2598. lbValue lhs = lb_address_from_load_or_generate_local(p, x);
  2599. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2600. args[1] = lb_const_int(p->module, t_int, type_size_of(t));
  2601. lbValue val = lb_emit_runtime_call(p, "memory_compare_zero", args);
  2602. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_int(p->module, t_int, 0));
  2603. return res;
  2604. } else {
  2605. if (op_kind == Token_CmpEq) {
  2606. res.value = LLVMBuildIsNull(p->builder, x.value, "");
  2607. } else if (op_kind == Token_NotEq) {
  2608. res.value = LLVMBuildIsNotNull(p->builder, x.value, "");
  2609. }
  2610. }
  2611. return res;
  2612. }
  2613. case Type_Slice:
  2614. {
  2615. lbValue data = lb_emit_struct_ev(p, x, 0);
  2616. if (op_kind == Token_CmpEq) {
  2617. res.value = LLVMBuildIsNull(p->builder, data.value, "");
  2618. return res;
  2619. } else if (op_kind == Token_NotEq) {
  2620. res.value = LLVMBuildIsNotNull(p->builder, data.value, "");
  2621. return res;
  2622. }
  2623. }
  2624. break;
  2625. case Type_DynamicArray:
  2626. {
  2627. lbValue data = lb_emit_struct_ev(p, x, 0);
  2628. if (op_kind == Token_CmpEq) {
  2629. res.value = LLVMBuildIsNull(p->builder, data.value, "");
  2630. return res;
  2631. } else if (op_kind == Token_NotEq) {
  2632. res.value = LLVMBuildIsNotNull(p->builder, data.value, "");
  2633. return res;
  2634. }
  2635. }
  2636. break;
  2637. case Type_Map:
  2638. {
  2639. lbValue data_ptr = lb_emit_struct_ev(p, x, 0);
  2640. if (op_kind == Token_CmpEq) {
  2641. res.value = LLVMBuildIsNull(p->builder, data_ptr.value, "");
  2642. return res;
  2643. } else {
  2644. res.value = LLVMBuildIsNotNull(p->builder, data_ptr.value, "");
  2645. return res;
  2646. }
  2647. }
  2648. break;
  2649. case Type_Union:
  2650. {
  2651. if (type_size_of(t) == 0) {
  2652. if (op_kind == Token_CmpEq) {
  2653. return lb_const_bool(p->module, t_llvm_bool, true);
  2654. } else if (op_kind == Token_NotEq) {
  2655. return lb_const_bool(p->module, t_llvm_bool, false);
  2656. }
  2657. } else if (is_type_union_maybe_pointer(t)) {
  2658. lbValue tag = lb_emit_transmute(p, x, t_rawptr);
  2659. return lb_emit_comp_against_nil(p, op_kind, tag);
  2660. } else {
  2661. lbValue tag = lb_emit_union_tag_value(p, x);
  2662. return lb_emit_comp(p, op_kind, tag, lb_zero(p->module, tag.type));
  2663. }
  2664. }
  2665. case Type_Struct:
  2666. if (is_type_soa_struct(t)) {
  2667. Type *bt = base_type(t);
  2668. if (bt->Struct.soa_kind == StructSoa_Slice) {
  2669. LLVMValueRef the_value = {};
  2670. if (bt->Struct.fields.count == 0) {
  2671. lbValue len = lb_soa_struct_len(p, x);
  2672. the_value = len.value;
  2673. } else {
  2674. lbValue first_field = lb_emit_struct_ev(p, x, 0);
  2675. the_value = first_field.value;
  2676. }
  2677. if (op_kind == Token_CmpEq) {
  2678. res.value = LLVMBuildIsNull(p->builder, the_value, "");
  2679. return res;
  2680. } else if (op_kind == Token_NotEq) {
  2681. res.value = LLVMBuildIsNotNull(p->builder, the_value, "");
  2682. return res;
  2683. }
  2684. } else if (bt->Struct.soa_kind == StructSoa_Dynamic) {
  2685. LLVMValueRef the_value = {};
  2686. if (bt->Struct.fields.count == 0) {
  2687. lbValue cap = lb_soa_struct_cap(p, x);
  2688. the_value = cap.value;
  2689. } else {
  2690. lbValue first_field = lb_emit_struct_ev(p, x, 0);
  2691. the_value = first_field.value;
  2692. }
  2693. if (op_kind == Token_CmpEq) {
  2694. res.value = LLVMBuildIsNull(p->builder, the_value, "");
  2695. return res;
  2696. } else if (op_kind == Token_NotEq) {
  2697. res.value = LLVMBuildIsNotNull(p->builder, the_value, "");
  2698. return res;
  2699. }
  2700. }
  2701. } else if (is_type_struct(t) && type_has_nil(t)) {
  2702. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2703. lbValue lhs = lb_address_from_load_or_generate_local(p, x);
  2704. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2705. args[1] = lb_const_int(p->module, t_int, type_size_of(t));
  2706. lbValue val = lb_emit_runtime_call(p, "memory_compare_zero", args);
  2707. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_int(p->module, t_int, 0));
  2708. return res;
  2709. }
  2710. break;
  2711. }
  2712. GB_PANIC("Unknown handled type: %s -> %s", type_to_string(t), type_to_string(bt));
  2713. return {};
  2714. }
  2715. gb_internal lbValue lb_build_unary_and(lbProcedure *p, Ast *expr) {
  2716. ast_node(ue, UnaryExpr, expr);
  2717. auto tv = type_and_value_of_expr(expr);
  2718. Ast *ue_expr = unparen_expr(ue->expr);
  2719. if (ue_expr->kind == Ast_IndexExpr && tv.mode == Addressing_OptionalOkPtr && is_type_tuple(tv.type)) {
  2720. Type *tuple = tv.type;
  2721. Type *map_type = type_of_expr(ue_expr->IndexExpr.expr);
  2722. Type *ot = base_type(map_type);
  2723. Type *t = base_type(type_deref(ot));
  2724. bool deref = t != ot;
  2725. GB_ASSERT(t->kind == Type_Map);
  2726. ast_node(ie, IndexExpr, ue_expr);
  2727. lbValue map_val = lb_build_addr_ptr(p, ie->expr);
  2728. if (deref) {
  2729. map_val = lb_emit_load(p, map_val);
  2730. }
  2731. lbValue key = lb_build_expr(p, ie->index);
  2732. key = lb_emit_conv(p, key, t->Map.key);
  2733. lbAddr addr = lb_addr_map(map_val, key, t, alloc_type_pointer(t->Map.value));
  2734. lbValue ptr = lb_addr_get_ptr(p, addr);
  2735. lbValue ok = lb_emit_comp_against_nil(p, Token_NotEq, ptr);
  2736. ok = lb_emit_conv(p, ok, tuple->Tuple.variables[1]->type);
  2737. lbAddr res = lb_add_local_generated(p, tuple, false);
  2738. lbValue gep0 = lb_emit_struct_ep(p, res.addr, 0);
  2739. lbValue gep1 = lb_emit_struct_ep(p, res.addr, 1);
  2740. lb_emit_store(p, gep0, ptr);
  2741. lb_emit_store(p, gep1, ok);
  2742. return lb_addr_load(p, res);
  2743. } else if (is_type_soa_pointer(tv.type)) {
  2744. ast_node(ie, IndexExpr, ue_expr);
  2745. lbValue addr = lb_build_addr_ptr(p, ie->expr);
  2746. if (is_type_pointer(type_deref(addr.type))) {
  2747. addr = lb_emit_load(p, addr);
  2748. }
  2749. GB_ASSERT(is_type_pointer(addr.type));
  2750. lbValue index = lb_build_expr(p, ie->index);
  2751. if (!build_context.no_bounds_check) {
  2752. // TODO(bill): soa bounds checking
  2753. }
  2754. return lb_make_soa_pointer(p, tv.type, addr, index);
  2755. } else if (ue_expr->kind == Ast_CompoundLit) {
  2756. lbValue v = lb_build_expr(p, ue->expr);
  2757. Type *type = v.type;
  2758. lbAddr addr = {};
  2759. if (p->is_startup) {
  2760. addr = lb_add_global_generated(p->module, type, v);
  2761. } else {
  2762. addr = lb_add_local_generated(p, type, false);
  2763. }
  2764. lb_addr_store(p, addr, v);
  2765. return addr.addr;
  2766. } else if (ue_expr->kind == Ast_TypeAssertion) {
  2767. if (is_type_tuple(tv.type)) {
  2768. Type *tuple = tv.type;
  2769. Type *ptr_type = tuple->Tuple.variables[0]->type;
  2770. Type *ok_type = tuple->Tuple.variables[1]->type;
  2771. ast_node(ta, TypeAssertion, ue_expr);
  2772. TokenPos pos = ast_token(expr).pos;
  2773. Type *type = type_of_expr(ue_expr);
  2774. GB_ASSERT(!is_type_tuple(type));
  2775. lbValue e = lb_build_expr(p, ta->expr);
  2776. Type *t = type_deref(e.type);
  2777. if (is_type_union(t)) {
  2778. lbValue v = e;
  2779. if (!is_type_pointer(v.type)) {
  2780. v = lb_address_from_load_or_generate_local(p, v);
  2781. }
  2782. Type *src_type = type_deref(v.type);
  2783. Type *dst_type = type;
  2784. lbValue src_tag = {};
  2785. lbValue dst_tag = {};
  2786. if (is_type_union_maybe_pointer(src_type)) {
  2787. src_tag = lb_emit_comp_against_nil(p, Token_NotEq, v);
  2788. dst_tag = lb_const_bool(p->module, t_bool, true);
  2789. } else {
  2790. src_tag = lb_emit_load(p, lb_emit_union_tag_ptr(p, v));
  2791. dst_tag = lb_const_union_tag(p->module, src_type, dst_type);
  2792. }
  2793. lbValue ok = lb_emit_comp(p, Token_CmpEq, src_tag, dst_tag);
  2794. lbValue data_ptr = lb_emit_conv(p, v, ptr_type);
  2795. lbAddr res = lb_add_local_generated(p, tuple, true);
  2796. lbValue gep0 = lb_emit_struct_ep(p, res.addr, 0);
  2797. lbValue gep1 = lb_emit_struct_ep(p, res.addr, 1);
  2798. lb_emit_store(p, gep0, lb_emit_select(p, ok, data_ptr, lb_const_nil(p->module, ptr_type)));
  2799. lb_emit_store(p, gep1, lb_emit_conv(p, ok, ok_type));
  2800. return lb_addr_load(p, res);
  2801. } else if (is_type_any(t)) {
  2802. lbValue v = e;
  2803. if (is_type_pointer(v.type)) {
  2804. v = lb_emit_load(p, v);
  2805. }
  2806. lbValue data_ptr = lb_emit_conv(p, lb_emit_struct_ev(p, v, 0), ptr_type);
  2807. lbValue any_id = lb_emit_struct_ev(p, v, 1);
  2808. lbValue id = lb_typeid(p->module, type);
  2809. lbValue ok = lb_emit_comp(p, Token_CmpEq, any_id, id);
  2810. lbAddr res = lb_add_local_generated(p, tuple, false);
  2811. lbValue gep0 = lb_emit_struct_ep(p, res.addr, 0);
  2812. lbValue gep1 = lb_emit_struct_ep(p, res.addr, 1);
  2813. lb_emit_store(p, gep0, lb_emit_select(p, ok, data_ptr, lb_const_nil(p->module, ptr_type)));
  2814. lb_emit_store(p, gep1, lb_emit_conv(p, ok, ok_type));
  2815. return lb_addr_load(p, res);
  2816. } else {
  2817. GB_PANIC("TODO(bill): type assertion %s", type_to_string(type));
  2818. }
  2819. } else {
  2820. GB_ASSERT(is_type_pointer(tv.type));
  2821. ast_node(ta, TypeAssertion, ue_expr);
  2822. TokenPos pos = ast_token(expr).pos;
  2823. Type *type = type_of_expr(ue_expr);
  2824. GB_ASSERT(!is_type_tuple(type));
  2825. lbValue e = lb_build_expr(p, ta->expr);
  2826. Type *t = type_deref(e.type);
  2827. if (is_type_union(t)) {
  2828. lbValue v = e;
  2829. if (!is_type_pointer(v.type)) {
  2830. v = lb_address_from_load_or_generate_local(p, v);
  2831. }
  2832. Type *src_type = type_deref(v.type);
  2833. Type *dst_type = type;
  2834. if (!build_context.no_type_assert && (p->state_flags & StateFlag_no_type_assert) == 0) {
  2835. lbValue src_tag = {};
  2836. lbValue dst_tag = {};
  2837. if (is_type_union_maybe_pointer(src_type)) {
  2838. src_tag = lb_emit_comp_against_nil(p, Token_NotEq, v);
  2839. dst_tag = lb_const_bool(p->module, t_bool, true);
  2840. } else {
  2841. src_tag = lb_emit_load(p, lb_emit_union_tag_ptr(p, v));
  2842. dst_tag = lb_const_union_tag(p->module, src_type, dst_type);
  2843. }
  2844. isize arg_count = 6;
  2845. if (build_context.no_rtti) {
  2846. arg_count = 4;
  2847. }
  2848. lbValue ok = lb_emit_comp(p, Token_CmpEq, src_tag, dst_tag);
  2849. auto args = array_make<lbValue>(permanent_allocator(), arg_count);
  2850. args[0] = ok;
  2851. args[1] = lb_find_or_add_entity_string(p->module, get_file_path_string(pos.file_id));
  2852. args[2] = lb_const_int(p->module, t_i32, pos.line);
  2853. args[3] = lb_const_int(p->module, t_i32, pos.column);
  2854. if (!build_context.no_rtti) {
  2855. args[4] = lb_typeid(p->module, src_type);
  2856. args[5] = lb_typeid(p->module, dst_type);
  2857. }
  2858. lb_emit_runtime_call(p, "type_assertion_check", args);
  2859. }
  2860. lbValue data_ptr = v;
  2861. return lb_emit_conv(p, data_ptr, tv.type);
  2862. } else if (is_type_any(t)) {
  2863. lbValue v = e;
  2864. if (is_type_pointer(v.type)) {
  2865. v = lb_emit_load(p, v);
  2866. }
  2867. lbValue data_ptr = lb_emit_struct_ev(p, v, 0);
  2868. if (!build_context.no_type_assert && (p->state_flags & StateFlag_no_type_assert) == 0) {
  2869. GB_ASSERT(!build_context.no_rtti);
  2870. lbValue any_id = lb_emit_struct_ev(p, v, 1);
  2871. lbValue id = lb_typeid(p->module, type);
  2872. lbValue ok = lb_emit_comp(p, Token_CmpEq, any_id, id);
  2873. auto args = array_make<lbValue>(permanent_allocator(), 6);
  2874. args[0] = ok;
  2875. args[1] = lb_find_or_add_entity_string(p->module, get_file_path_string(pos.file_id));
  2876. args[2] = lb_const_int(p->module, t_i32, pos.line);
  2877. args[3] = lb_const_int(p->module, t_i32, pos.column);
  2878. args[4] = any_id;
  2879. args[5] = id;
  2880. lb_emit_runtime_call(p, "type_assertion_check", args);
  2881. }
  2882. return lb_emit_conv(p, data_ptr, tv.type);
  2883. } else {
  2884. GB_PANIC("TODO(bill): type assertion %s", type_to_string(type));
  2885. }
  2886. }
  2887. }
  2888. return lb_build_addr_ptr(p, ue->expr);
  2889. }
  2890. gb_internal lbValue lb_build_expr_internal(lbProcedure *p, Ast *expr);
  2891. gb_internal lbValue lb_build_expr(lbProcedure *p, Ast *expr) {
  2892. u16 prev_state_flags = p->state_flags;
  2893. defer (p->state_flags = prev_state_flags);
  2894. if (expr->state_flags != 0) {
  2895. u16 in = expr->state_flags;
  2896. u16 out = p->state_flags;
  2897. if (in & StateFlag_bounds_check) {
  2898. out |= StateFlag_bounds_check;
  2899. out &= ~StateFlag_no_bounds_check;
  2900. } else if (in & StateFlag_no_bounds_check) {
  2901. out |= StateFlag_no_bounds_check;
  2902. out &= ~StateFlag_bounds_check;
  2903. }
  2904. if (in & StateFlag_type_assert) {
  2905. out |= StateFlag_type_assert;
  2906. out &= ~StateFlag_no_type_assert;
  2907. } else if (in & StateFlag_no_type_assert) {
  2908. out |= StateFlag_no_type_assert;
  2909. out &= ~StateFlag_type_assert;
  2910. }
  2911. p->state_flags = out;
  2912. }
  2913. // IMPORTANT NOTE(bill):
  2914. // Selector Call Expressions (foo->bar(...))
  2915. // must only evaluate `foo` once as it gets transformed into
  2916. // `foo.bar(foo, ...)`
  2917. // And if `foo` is a procedure call or something more complex, storing the value
  2918. // once is a very good idea
  2919. // If a stored value is found, it must be removed from the cache
  2920. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  2921. lbValue *pp = map_get(&p->selector_values, expr);
  2922. if (pp != nullptr) {
  2923. lbValue res = *pp;
  2924. map_remove(&p->selector_values, expr);
  2925. return res;
  2926. }
  2927. lbAddr *pa = map_get(&p->selector_addr, expr);
  2928. if (pa != nullptr) {
  2929. lbAddr res = *pa;
  2930. map_remove(&p->selector_addr, expr);
  2931. return lb_addr_load(p, res);
  2932. }
  2933. }
  2934. lbValue res = lb_build_expr_internal(p, expr);
  2935. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  2936. map_set(&p->selector_values, expr, res);
  2937. }
  2938. return res;
  2939. }
  2940. gb_internal lbValue lb_build_expr_internal(lbProcedure *p, Ast *expr) {
  2941. lbModule *m = p->module;
  2942. expr = unparen_expr(expr);
  2943. TokenPos expr_pos = ast_token(expr).pos;
  2944. TypeAndValue tv = type_and_value_of_expr(expr);
  2945. Type *type = type_of_expr(expr);
  2946. GB_ASSERT_MSG(tv.mode != Addressing_Invalid, "invalid expression '%s' (tv.mode = %d, tv.type = %s) @ %s\n Current Proc: %.*s : %s", expr_to_string(expr), tv.mode, type_to_string(tv.type), token_pos_to_string(expr_pos), LIT(p->name), type_to_string(p->type));
  2947. if (tv.value.kind != ExactValue_Invalid) {
  2948. // NOTE(bill): Short on constant values
  2949. return lb_const_value(p->module, type, tv.value);
  2950. } else if (tv.mode == Addressing_Type) {
  2951. // NOTE(bill, 2023-01-16): is this correct? I hope so at least
  2952. return lb_typeid(m, tv.type);
  2953. }
  2954. switch (expr->kind) {
  2955. case_ast_node(bl, BasicLit, expr);
  2956. TokenPos pos = bl->token.pos;
  2957. GB_PANIC("Non-constant basic literal %s - %.*s", token_pos_to_string(pos), LIT(token_strings[bl->token.kind]));
  2958. case_end;
  2959. case_ast_node(bd, BasicDirective, expr);
  2960. TokenPos pos = bd->token.pos;
  2961. GB_PANIC("Non-constant basic literal %s - %.*s", token_pos_to_string(pos), LIT(bd->name.string));
  2962. case_end;
  2963. case_ast_node(i, Implicit, expr);
  2964. return lb_addr_load(p, lb_build_addr(p, expr));
  2965. case_end;
  2966. case_ast_node(u, Uninit, expr)
  2967. lbValue res = {};
  2968. if (is_type_untyped(type)) {
  2969. res.value = nullptr;
  2970. res.type = t_untyped_uninit;
  2971. } else {
  2972. res.value = LLVMGetUndef(lb_type(m, type));
  2973. res.type = type;
  2974. }
  2975. return res;
  2976. case_end;
  2977. case_ast_node(i, Ident, expr);
  2978. Entity *e = entity_from_expr(expr);
  2979. e = strip_entity_wrapping(e);
  2980. GB_ASSERT_MSG(e != nullptr, "%s in %.*s %p", expr_to_string(expr), LIT(p->name), expr);
  2981. if (e->kind == Entity_Builtin) {
  2982. Token token = ast_token(expr);
  2983. GB_PANIC("TODO(bill): lb_build_expr Entity_Builtin '%.*s'\n"
  2984. "\t at %s", LIT(builtin_procs[e->Builtin.id].name),
  2985. token_pos_to_string(token.pos));
  2986. return {};
  2987. } else if (e->kind == Entity_Nil) {
  2988. lbValue res = {};
  2989. res.value = nullptr;
  2990. res.type = e->type;
  2991. return res;
  2992. }
  2993. GB_ASSERT(e->kind != Entity_ProcGroup);
  2994. return lb_find_ident(p, m, e, expr);
  2995. case_end;
  2996. case_ast_node(de, DerefExpr, expr);
  2997. return lb_addr_load(p, lb_build_addr(p, expr));
  2998. case_end;
  2999. case_ast_node(se, SelectorExpr, expr);
  3000. TypeAndValue tav = type_and_value_of_expr(expr);
  3001. GB_ASSERT(tav.mode != Addressing_Invalid);
  3002. return lb_addr_load(p, lb_build_addr(p, expr));
  3003. case_end;
  3004. case_ast_node(ise, ImplicitSelectorExpr, expr);
  3005. TypeAndValue tav = type_and_value_of_expr(expr);
  3006. GB_ASSERT(tav.mode == Addressing_Constant);
  3007. return lb_const_value(p->module, type, tv.value);
  3008. case_end;
  3009. case_ast_node(se, SelectorCallExpr, expr);
  3010. GB_ASSERT(se->modified_call);
  3011. return lb_build_call_expr(p, se->call);
  3012. case_end;
  3013. case_ast_node(te, TernaryIfExpr, expr);
  3014. LLVMValueRef incoming_values[2] = {};
  3015. LLVMBasicBlockRef incoming_blocks[2] = {};
  3016. GB_ASSERT(te->y != nullptr);
  3017. lbBlock *then = lb_create_block(p, "if.then");
  3018. lbBlock *done = lb_create_block(p, "if.done"); // NOTE(bill): Append later
  3019. lbBlock *else_ = lb_create_block(p, "if.else");
  3020. lb_build_cond(p, te->cond, then, else_);
  3021. lb_start_block(p, then);
  3022. Type *type = default_type(type_of_expr(expr));
  3023. LLVMTypeRef llvm_type = lb_type(p->module, type);
  3024. incoming_values[0] = lb_emit_conv(p, lb_build_expr(p, te->x), type).value;
  3025. if (is_type_internally_pointer_like(type)) {
  3026. incoming_values[0] = LLVMBuildBitCast(p->builder, incoming_values[0], llvm_type, "");
  3027. }
  3028. lb_emit_jump(p, done);
  3029. lb_start_block(p, else_);
  3030. incoming_values[1] = lb_emit_conv(p, lb_build_expr(p, te->y), type).value;
  3031. if (is_type_internally_pointer_like(type)) {
  3032. incoming_values[1] = LLVMBuildBitCast(p->builder, incoming_values[1], llvm_type, "");
  3033. }
  3034. lb_emit_jump(p, done);
  3035. lb_start_block(p, done);
  3036. lbValue res = {};
  3037. res.value = LLVMBuildPhi(p->builder, llvm_type, "");
  3038. res.type = type;
  3039. GB_ASSERT(p->curr_block->preds.count >= 2);
  3040. incoming_blocks[0] = p->curr_block->preds[0]->block;
  3041. incoming_blocks[1] = p->curr_block->preds[1]->block;
  3042. LLVMAddIncoming(res.value, incoming_values, incoming_blocks, 2);
  3043. return res;
  3044. case_end;
  3045. case_ast_node(te, TernaryWhenExpr, expr);
  3046. TypeAndValue tav = type_and_value_of_expr(te->cond);
  3047. GB_ASSERT(tav.mode == Addressing_Constant);
  3048. GB_ASSERT(tav.value.kind == ExactValue_Bool);
  3049. if (tav.value.value_bool) {
  3050. return lb_build_expr(p, te->x);
  3051. } else {
  3052. return lb_build_expr(p, te->y);
  3053. }
  3054. case_end;
  3055. case_ast_node(oe, OrElseExpr, expr);
  3056. return lb_emit_or_else(p, oe->x, oe->y, tv);
  3057. case_end;
  3058. case_ast_node(oe, OrReturnExpr, expr);
  3059. return lb_emit_or_return(p, oe->expr, tv);
  3060. case_end;
  3061. case_ast_node(be, OrBranchExpr, expr);
  3062. lbBlock *block = nullptr;
  3063. if (be->label != nullptr) {
  3064. lbBranchBlocks bb = lb_lookup_branch_blocks(p, be->label);
  3065. switch (be->token.kind) {
  3066. case Token_or_break: block = bb.break_; break;
  3067. case Token_or_continue: block = bb.continue_; break;
  3068. }
  3069. } else {
  3070. for (lbTargetList *t = p->target_list; t != nullptr && block == nullptr; t = t->prev) {
  3071. if (t->is_block) {
  3072. continue;
  3073. }
  3074. switch (be->token.kind) {
  3075. case Token_or_break: block = t->break_; break;
  3076. case Token_or_continue: block = t->continue_; break;
  3077. }
  3078. }
  3079. }
  3080. GB_ASSERT(block != nullptr);
  3081. lbValue lhs = {};
  3082. lbValue rhs = {};
  3083. lb_emit_try_lhs_rhs(p, be->expr, tv, &lhs, &rhs);
  3084. Type *type = default_type(tv.type);
  3085. if (lhs.value) {
  3086. lhs = lb_emit_conv(p, lhs, type);
  3087. } else if (type != nullptr && type != t_invalid) {
  3088. lhs = lb_const_nil(p->module, type);
  3089. }
  3090. lbBlock *then = lb_create_block(p, "or_branch.then");
  3091. lbBlock *else_ = lb_create_block(p, "or_branch.else");
  3092. lb_emit_if(p, lb_emit_try_has_value(p, rhs), then, else_);
  3093. lb_start_block(p, else_);
  3094. lb_emit_defer_stmts(p, lbDeferExit_Branch, block);
  3095. lb_emit_jump(p, block);
  3096. lb_start_block(p, then);
  3097. return lhs;
  3098. case_end;
  3099. case_ast_node(ta, TypeAssertion, expr);
  3100. TokenPos pos = ast_token(expr).pos;
  3101. lbValue e = lb_build_expr(p, ta->expr);
  3102. Type *t = type_deref(e.type);
  3103. if (is_type_union(t)) {
  3104. if (ta->ignores[0]) {
  3105. // NOTE(bill): This is not needed for optimization levels other than 0
  3106. return lb_emit_union_cast_only_ok_check(p, e, type, pos);
  3107. }
  3108. return lb_emit_union_cast(p, e, type, pos);
  3109. } else if (is_type_any(t)) {
  3110. return lb_emit_any_cast(p, e, type, pos);
  3111. } else {
  3112. GB_PANIC("TODO(bill): type assertion %s", type_to_string(e.type));
  3113. }
  3114. case_end;
  3115. case_ast_node(tc, TypeCast, expr);
  3116. lbValue e = lb_build_expr(p, tc->expr);
  3117. switch (tc->token.kind) {
  3118. case Token_cast:
  3119. return lb_emit_conv(p, e, type);
  3120. case Token_transmute:
  3121. return lb_emit_transmute(p, e, type);
  3122. }
  3123. GB_PANIC("Invalid AST TypeCast");
  3124. case_end;
  3125. case_ast_node(ac, AutoCast, expr);
  3126. lbValue value = lb_build_expr(p, ac->expr);
  3127. return lb_emit_conv(p, value, type);
  3128. case_end;
  3129. case_ast_node(ue, UnaryExpr, expr);
  3130. switch (ue->op.kind) {
  3131. case Token_And:
  3132. return lb_build_unary_and(p, expr);
  3133. default:
  3134. {
  3135. lbValue v = lb_build_expr(p, ue->expr);
  3136. return lb_emit_unary_arith(p, ue->op.kind, v, type);
  3137. }
  3138. }
  3139. case_end;
  3140. case_ast_node(be, BinaryExpr, expr);
  3141. return lb_build_binary_expr(p, expr);
  3142. case_end;
  3143. case_ast_node(pl, ProcLit, expr);
  3144. return lb_generate_anonymous_proc_lit(p->module, p->name, expr, p);
  3145. case_end;
  3146. case_ast_node(cl, CompoundLit, expr);
  3147. return lb_addr_load(p, lb_build_addr(p, expr));
  3148. case_end;
  3149. case_ast_node(ce, CallExpr, expr);
  3150. return lb_build_call_expr(p, expr);
  3151. case_end;
  3152. case_ast_node(se, SliceExpr, expr);
  3153. if (is_type_slice(type_of_expr(se->expr))) {
  3154. // NOTE(bill): Quick optimization
  3155. if (se->high == nullptr &&
  3156. (se->low == nullptr || lb_is_expr_constant_zero(se->low))) {
  3157. return lb_build_expr(p, se->expr);
  3158. }
  3159. }
  3160. return lb_addr_load(p, lb_build_addr(p, expr));
  3161. case_end;
  3162. case_ast_node(ie, IndexExpr, expr);
  3163. return lb_addr_load(p, lb_build_addr(p, expr));
  3164. case_end;
  3165. case_ast_node(ie, MatrixIndexExpr, expr);
  3166. return lb_addr_load(p, lb_build_addr(p, expr));
  3167. case_end;
  3168. case_ast_node(ia, InlineAsmExpr, expr);
  3169. Type *t = type_of_expr(expr);
  3170. GB_ASSERT(is_type_asm_proc(t));
  3171. String asm_string = {};
  3172. String constraints_string = {};
  3173. TypeAndValue tav;
  3174. tav = type_and_value_of_expr(ia->asm_string);
  3175. GB_ASSERT(is_type_string(tav.type));
  3176. GB_ASSERT(tav.value.kind == ExactValue_String);
  3177. asm_string = tav.value.value_string;
  3178. tav = type_and_value_of_expr(ia->constraints_string);
  3179. GB_ASSERT(is_type_string(tav.type));
  3180. GB_ASSERT(tav.value.kind == ExactValue_String);
  3181. constraints_string = tav.value.value_string;
  3182. LLVMInlineAsmDialect dialect = LLVMInlineAsmDialectATT;
  3183. switch (ia->dialect) {
  3184. case InlineAsmDialect_Default: dialect = LLVMInlineAsmDialectATT; break;
  3185. case InlineAsmDialect_ATT: dialect = LLVMInlineAsmDialectATT; break;
  3186. case InlineAsmDialect_Intel: dialect = LLVMInlineAsmDialectIntel; break;
  3187. default: GB_PANIC("Unhandled inline asm dialect"); break;
  3188. }
  3189. LLVMTypeRef func_type = lb_type_internal_for_procedures_raw(p->module, t);
  3190. LLVMValueRef the_asm = llvm_get_inline_asm(func_type, asm_string, constraints_string, ia->has_side_effects, ia->has_side_effects, dialect);
  3191. GB_ASSERT(the_asm != nullptr);
  3192. return {the_asm, t};
  3193. case_end;
  3194. }
  3195. GB_PANIC("lb_build_expr: %.*s", LIT(ast_strings[expr->kind]));
  3196. return {};
  3197. }
  3198. gb_internal lbAddr lb_get_soa_variable_addr(lbProcedure *p, Entity *e) {
  3199. return map_must_get(&p->module->soa_values, e);
  3200. }
  3201. gb_internal lbValue lb_get_using_variable(lbProcedure *p, Entity *e) {
  3202. GB_ASSERT(e->kind == Entity_Variable && e->flags & EntityFlag_Using);
  3203. String name = e->token.string;
  3204. Entity *parent = e->using_parent;
  3205. Selection sel = lookup_field(parent->type, name, false);
  3206. GB_ASSERT(sel.entity != nullptr);
  3207. lbValue *pv = map_get(&p->module->values, parent);
  3208. lbValue v = {};
  3209. bool is_soa = false;
  3210. if (pv == nullptr && parent->flags & EntityFlag_SoaPtrField) {
  3211. is_soa = true;
  3212. // NOTE(bill): using SOA value (probably from for-in statement)
  3213. lbAddr parent_addr = lb_get_soa_variable_addr(p, parent);
  3214. v = lb_addr_get_ptr(p, parent_addr);
  3215. } else if (pv != nullptr) {
  3216. v = *pv;
  3217. } else {
  3218. GB_ASSERT_MSG(e->using_expr != nullptr, "%.*s", LIT(name));
  3219. v = lb_build_addr_ptr(p, e->using_expr);
  3220. }
  3221. GB_ASSERT(v.value != nullptr);
  3222. GB_ASSERT_MSG(is_soa || parent->type == type_deref(v.type), "%s %s", type_to_string(parent->type), type_to_string(v.type));
  3223. lbValue ptr = lb_emit_deep_field_gep(p, v, sel);
  3224. if (parent->scope) {
  3225. if ((parent->scope->flags & (ScopeFlag_File|ScopeFlag_Pkg)) == 0) {
  3226. lb_add_debug_local_variable(p, ptr.value, e->type, e->token);
  3227. }
  3228. } else {
  3229. lb_add_debug_local_variable(p, ptr.value, e->type, e->token);
  3230. }
  3231. return ptr;
  3232. }
  3233. gb_internal lbAddr lb_build_addr_from_entity(lbProcedure *p, Entity *e, Ast *expr) {
  3234. GB_ASSERT(e != nullptr);
  3235. if (e->kind == Entity_Constant) {
  3236. Type *t = default_type(type_of_expr(expr));
  3237. lbValue v = lb_const_value(p->module, t, e->Constant.value);
  3238. if (LLVMIsConstant(v.value)) {
  3239. lbAddr g = lb_add_global_generated(p->module, t, v);
  3240. return g;
  3241. }
  3242. GB_ASSERT(LLVMIsALoadInst(v.value));
  3243. lbValue ptr = {};
  3244. ptr.value = LLVMGetOperand(v.value, 0);
  3245. ptr.type = alloc_type_pointer(t);
  3246. return lb_addr(ptr);
  3247. }
  3248. lbValue v = {};
  3249. lbValue *found = map_get(&p->module->values, e);
  3250. if (found) {
  3251. v = *found;
  3252. } else if (e->kind == Entity_Variable && e->flags & EntityFlag_Using) {
  3253. // NOTE(bill): Calculate the using variable every time
  3254. v = lb_get_using_variable(p, e);
  3255. } else if (e->flags & EntityFlag_SoaPtrField) {
  3256. return lb_get_soa_variable_addr(p, e);
  3257. }
  3258. if (v.value == nullptr) {
  3259. return lb_addr(lb_find_value_from_entity(p->module, e));
  3260. // error(expr, "%.*s Unknown value: %.*s, entity: %p %.*s",
  3261. // LIT(p->name),
  3262. // LIT(e->token.string), e, LIT(entity_strings[e->kind]));
  3263. // GB_PANIC("Unknown value");
  3264. }
  3265. return lb_addr(v);
  3266. }
  3267. gb_internal lbAddr lb_build_array_swizzle_addr(lbProcedure *p, AstCallExpr *ce, TypeAndValue const &tv) {
  3268. isize index_count = ce->args.count-1;
  3269. lbAddr addr = lb_build_addr(p, ce->args[0]);
  3270. if (index_count == 0) {
  3271. return addr;
  3272. }
  3273. Type *type = base_type(lb_addr_type(addr));
  3274. GB_ASSERT(type->kind == Type_Array);
  3275. i64 count = type->Array.count;
  3276. if (count <= 4 && index_count <= 4) {
  3277. u8 indices[4] = {};
  3278. u8 index_count = 0;
  3279. for (i32 i = 1; i < ce->args.count; i++) {
  3280. TypeAndValue tv = type_and_value_of_expr(ce->args[i]);
  3281. GB_ASSERT(is_type_integer(tv.type));
  3282. GB_ASSERT(tv.value.kind == ExactValue_Integer);
  3283. i64 src_index = big_int_to_i64(&tv.value.value_integer);
  3284. indices[index_count++] = cast(u8)src_index;
  3285. }
  3286. return lb_addr_swizzle(lb_addr_get_ptr(p, addr), tv.type, index_count, indices);
  3287. }
  3288. auto indices = slice_make<i32>(permanent_allocator(), ce->args.count-1);
  3289. isize index_index = 0;
  3290. for (i32 i = 1; i < ce->args.count; i++) {
  3291. TypeAndValue tv = type_and_value_of_expr(ce->args[i]);
  3292. GB_ASSERT(is_type_integer(tv.type));
  3293. GB_ASSERT(tv.value.kind == ExactValue_Integer);
  3294. i64 src_index = big_int_to_i64(&tv.value.value_integer);
  3295. indices[index_index++] = cast(i32)src_index;
  3296. }
  3297. return lb_addr_swizzle_large(lb_addr_get_ptr(p, addr), tv.type, indices);
  3298. }
  3299. gb_internal lbAddr lb_build_addr_internal(lbProcedure *p, Ast *expr);
  3300. gb_internal lbAddr lb_build_addr(lbProcedure *p, Ast *expr) {
  3301. expr = unparen_expr(expr);
  3302. // IMPORTANT NOTE(bill):
  3303. // Selector Call Expressions (foo->bar(...))
  3304. // must only evaluate `foo` once as it gets transformed into
  3305. // `foo.bar(foo, ...)`
  3306. // And if `foo` is a procedure call or something more complex, storing the value
  3307. // once is a very good idea
  3308. // If a stored value is found, it must be removed from the cache
  3309. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  3310. lbAddr *pp = map_get(&p->selector_addr, expr);
  3311. if (pp != nullptr) {
  3312. lbAddr res = *pp;
  3313. map_remove(&p->selector_addr, expr);
  3314. return res;
  3315. }
  3316. }
  3317. lbAddr addr = lb_build_addr_internal(p, expr);
  3318. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  3319. map_set(&p->selector_addr, expr, addr);
  3320. }
  3321. return addr;
  3322. }
  3323. gb_internal void lb_build_addr_compound_lit_populate(lbProcedure *p, Slice<Ast *> const &elems, Array<lbCompoundLitElemTempData> *temp_data, Type *compound_type) {
  3324. Type *bt = base_type(compound_type);
  3325. Type *et = nullptr;
  3326. switch (bt->kind) {
  3327. case Type_Array: et = bt->Array.elem; break;
  3328. case Type_EnumeratedArray: et = bt->EnumeratedArray.elem; break;
  3329. case Type_Slice: et = bt->Slice.elem; break;
  3330. case Type_BitSet: et = bt->BitSet.elem; break;
  3331. case Type_DynamicArray: et = bt->DynamicArray.elem; break;
  3332. case Type_SimdVector: et = bt->SimdVector.elem; break;
  3333. case Type_Matrix: et = bt->Matrix.elem; break;
  3334. }
  3335. GB_ASSERT(et != nullptr);
  3336. // NOTE(bill): Separate value, gep, store into their own chunks
  3337. for_array(i, elems) {
  3338. Ast *elem = elems[i];
  3339. if (elem->kind == Ast_FieldValue) {
  3340. ast_node(fv, FieldValue, elem);
  3341. if (bt->kind != Type_DynamicArray && lb_is_elem_const(fv->value, et)) {
  3342. continue;
  3343. }
  3344. if (is_ast_range(fv->field)) {
  3345. ast_node(ie, BinaryExpr, fv->field);
  3346. TypeAndValue lo_tav = ie->left->tav;
  3347. TypeAndValue hi_tav = ie->right->tav;
  3348. GB_ASSERT(lo_tav.mode == Addressing_Constant);
  3349. GB_ASSERT(hi_tav.mode == Addressing_Constant);
  3350. TokenKind op = ie->op.kind;
  3351. i64 lo = exact_value_to_i64(lo_tav.value);
  3352. i64 hi = exact_value_to_i64(hi_tav.value);
  3353. if (op != Token_RangeHalf) {
  3354. hi += 1;
  3355. }
  3356. lbValue value = lb_emit_conv(p, lb_build_expr(p, fv->value), et);
  3357. GB_ASSERT((hi-lo) > 0);
  3358. if (bt->kind == Type_Matrix) {
  3359. for (i64 k = lo; k < hi; k++) {
  3360. lbCompoundLitElemTempData data = {};
  3361. data.value = value;
  3362. data.elem_index = matrix_row_major_index_to_offset(bt, k);
  3363. array_add(temp_data, data);
  3364. }
  3365. } else {
  3366. enum {MAX_ELEMENT_AMOUNT = 32};
  3367. if ((hi-lo) <= MAX_ELEMENT_AMOUNT) {
  3368. for (i64 k = lo; k < hi; k++) {
  3369. lbCompoundLitElemTempData data = {};
  3370. data.value = value;
  3371. data.elem_index = k;
  3372. array_add(temp_data, data);
  3373. }
  3374. } else {
  3375. lbCompoundLitElemTempData data = {};
  3376. data.value = value;
  3377. data.elem_index = lo;
  3378. data.elem_length = hi-lo;
  3379. array_add(temp_data, data);
  3380. }
  3381. }
  3382. } else {
  3383. auto tav = fv->field->tav;
  3384. GB_ASSERT(tav.mode == Addressing_Constant);
  3385. i64 index = exact_value_to_i64(tav.value);
  3386. lbValue value = lb_emit_conv(p, lb_build_expr(p, fv->value), et);
  3387. GB_ASSERT(!is_type_tuple(value.type));
  3388. lbCompoundLitElemTempData data = {};
  3389. data.value = value;
  3390. data.expr = fv->value;
  3391. if (bt->kind == Type_Matrix) {
  3392. data.elem_index = matrix_row_major_index_to_offset(bt, index);
  3393. } else {
  3394. data.elem_index = index;
  3395. }
  3396. array_add(temp_data, data);
  3397. }
  3398. } else {
  3399. if (bt->kind != Type_DynamicArray && lb_is_elem_const(elem, et)) {
  3400. continue;
  3401. }
  3402. lbValue field_expr = lb_build_expr(p, elem);
  3403. GB_ASSERT(!is_type_tuple(field_expr.type));
  3404. lbValue ev = lb_emit_conv(p, field_expr, et);
  3405. lbCompoundLitElemTempData data = {};
  3406. data.value = ev;
  3407. if (bt->kind == Type_Matrix) {
  3408. data.elem_index = matrix_row_major_index_to_offset(bt, i);
  3409. } else {
  3410. data.elem_index = i;
  3411. }
  3412. array_add(temp_data, data);
  3413. }
  3414. }
  3415. }
  3416. gb_internal void lb_build_addr_compound_lit_assign_array(lbProcedure *p, Array<lbCompoundLitElemTempData> const &temp_data) {
  3417. for (auto const &td : temp_data) {
  3418. if (td.value.value != nullptr) {
  3419. if (td.elem_length > 0) {
  3420. auto loop_data = lb_loop_start(p, cast(isize)td.elem_length, t_i32);
  3421. {
  3422. lbValue dst = td.gep;
  3423. dst = lb_emit_ptr_offset(p, dst, loop_data.idx);
  3424. lb_emit_store(p, dst, td.value);
  3425. }
  3426. lb_loop_end(p, loop_data);
  3427. } else {
  3428. lb_emit_store(p, td.gep, td.value);
  3429. }
  3430. }
  3431. }
  3432. }
  3433. gb_internal lbAddr lb_build_addr_index_expr(lbProcedure *p, Ast *expr) {
  3434. ast_node(ie, IndexExpr, expr);
  3435. Type *t = base_type(type_of_expr(ie->expr));
  3436. bool deref = is_type_pointer(t);
  3437. t = base_type(type_deref(t));
  3438. if (is_type_soa_struct(t)) {
  3439. // SOA STRUCTURES!!!!
  3440. lbValue val = lb_build_addr_ptr(p, ie->expr);
  3441. if (deref) {
  3442. val = lb_emit_load(p, val);
  3443. }
  3444. lbValue index = lb_build_expr(p, ie->index);
  3445. return lb_addr_soa_variable(val, index, ie->index);
  3446. }
  3447. if (ie->expr->tav.mode == Addressing_SoaVariable) {
  3448. // SOA Structures for slices/dynamic arrays
  3449. GB_ASSERT_MSG(is_type_multi_pointer(type_of_expr(ie->expr)), "%s", type_to_string(type_of_expr(ie->expr)));
  3450. lbValue field = lb_build_expr(p, ie->expr);
  3451. lbValue index = lb_build_expr(p, ie->index);
  3452. if (!build_context.no_bounds_check) {
  3453. Ast *se_expr = unparen_expr(ie->expr);
  3454. if (se_expr->kind == Ast_SelectorExpr) {
  3455. ast_node(se, SelectorExpr, se_expr);
  3456. lbValue len = {};
  3457. Type *type = base_type(type_deref(type_of_expr(se->expr)));
  3458. GB_ASSERT_MSG(is_type_soa_struct(type), "%s", type_to_string(type));
  3459. if (type->Struct.soa_kind == StructSoa_Fixed) {
  3460. len = lb_const_int(p->module, t_int, type->Struct.soa_count);
  3461. } else {
  3462. lbAddr *found = map_get(&p->selector_addr, se_expr);
  3463. if (found) {
  3464. lbAddr addr = *found;
  3465. lbValue parent = lb_addr_get_ptr(p, addr);
  3466. if (is_type_pointer(type_deref(parent.type))) {
  3467. parent = lb_emit_load(p, parent);
  3468. }
  3469. len = lb_soa_struct_len(p, parent);
  3470. }
  3471. }
  3472. if (len.value) {
  3473. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3474. }
  3475. } else {
  3476. // TODO(bill): how do you even do bounds checking here?
  3477. }
  3478. }
  3479. lbValue val = lb_emit_ptr_offset(p, field, index);
  3480. return lb_addr(val);
  3481. }
  3482. GB_ASSERT_MSG(is_type_indexable(t), "%s %s", type_to_string(t), expr_to_string(expr));
  3483. if (is_type_map(t)) {
  3484. lbAddr map_addr = lb_build_addr(p, ie->expr);
  3485. lbValue key = lb_build_expr(p, ie->index);
  3486. key = lb_emit_conv(p, key, t->Map.key);
  3487. Type *result_type = type_of_expr(expr);
  3488. lbValue map_ptr = lb_addr_get_ptr(p, map_addr);
  3489. if (is_type_pointer(type_deref(map_ptr.type))) {
  3490. map_ptr = lb_emit_load(p, map_ptr);
  3491. }
  3492. return lb_addr_map(map_ptr, key, t, result_type);
  3493. }
  3494. switch (t->kind) {
  3495. case Type_Array: {
  3496. lbValue array = {};
  3497. array = lb_build_addr_ptr(p, ie->expr);
  3498. if (deref) {
  3499. array = lb_emit_load(p, array);
  3500. }
  3501. lbValue index = lb_build_expr(p, ie->index);
  3502. index = lb_emit_conv(p, index, t_int);
  3503. lbValue elem = lb_emit_array_ep(p, array, index);
  3504. auto index_tv = type_and_value_of_expr(ie->index);
  3505. if (index_tv.mode != Addressing_Constant) {
  3506. lbValue len = lb_const_int(p->module, t_int, t->Array.count);
  3507. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3508. }
  3509. return lb_addr(elem);
  3510. }
  3511. case Type_EnumeratedArray: {
  3512. lbValue array = {};
  3513. array = lb_build_addr_ptr(p, ie->expr);
  3514. if (deref) {
  3515. array = lb_emit_load(p, array);
  3516. }
  3517. Type *index_type = t->EnumeratedArray.index;
  3518. auto index_tv = type_and_value_of_expr(ie->index);
  3519. lbValue index = {};
  3520. if (compare_exact_values(Token_NotEq, *t->EnumeratedArray.min_value, exact_value_i64(0))) {
  3521. if (index_tv.mode == Addressing_Constant) {
  3522. ExactValue idx = exact_value_sub(index_tv.value, *t->EnumeratedArray.min_value);
  3523. index = lb_const_value(p->module, index_type, idx);
  3524. } else {
  3525. index = lb_emit_arith(p, Token_Sub,
  3526. lb_build_expr(p, ie->index),
  3527. lb_const_value(p->module, index_type, *t->EnumeratedArray.min_value),
  3528. index_type);
  3529. index = lb_emit_conv(p, index, t_int);
  3530. }
  3531. } else {
  3532. index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3533. }
  3534. lbValue elem = lb_emit_array_ep(p, array, index);
  3535. if (index_tv.mode != Addressing_Constant) {
  3536. lbValue len = lb_const_int(p->module, t_int, t->EnumeratedArray.count);
  3537. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3538. }
  3539. return lb_addr(elem);
  3540. }
  3541. case Type_Slice: {
  3542. lbValue slice = {};
  3543. slice = lb_build_expr(p, ie->expr);
  3544. if (deref) {
  3545. slice = lb_emit_load(p, slice);
  3546. }
  3547. lbValue elem = lb_slice_elem(p, slice);
  3548. lbValue index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3549. lbValue len = lb_slice_len(p, slice);
  3550. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3551. lbValue v = lb_emit_ptr_offset(p, elem, index);
  3552. return lb_addr(v);
  3553. }
  3554. case Type_MultiPointer: {
  3555. lbValue multi_ptr = {};
  3556. multi_ptr = lb_build_expr(p, ie->expr);
  3557. if (deref) {
  3558. multi_ptr = lb_emit_load(p, multi_ptr);
  3559. }
  3560. lbValue index = lb_build_expr(p, ie->index);
  3561. index = lb_emit_conv(p, index, t_int);
  3562. lbValue v = {};
  3563. LLVMValueRef indices[1] = {index.value};
  3564. v.value = LLVMBuildGEP2(p->builder, lb_type(p->module, t->MultiPointer.elem), multi_ptr.value, indices, 1, "");
  3565. v.type = alloc_type_pointer(t->MultiPointer.elem);
  3566. return lb_addr(v);
  3567. }
  3568. case Type_RelativeMultiPointer: {
  3569. lbAddr rel_ptr_addr = {};
  3570. if (deref) {
  3571. lbValue rel_ptr_ptr = lb_build_expr(p, ie->expr);
  3572. rel_ptr_addr = lb_addr(rel_ptr_ptr);
  3573. } else {
  3574. rel_ptr_addr = lb_build_addr(p, ie->expr);
  3575. }
  3576. lbValue rel_ptr = lb_relative_pointer_to_pointer(p, rel_ptr_addr);
  3577. lbValue index = lb_build_expr(p, ie->index);
  3578. index = lb_emit_conv(p, index, t_int);
  3579. lbValue v = {};
  3580. Type *pointer_type = base_type(t->RelativeMultiPointer.pointer_type);
  3581. GB_ASSERT(pointer_type->kind == Type_MultiPointer);
  3582. Type *elem = pointer_type->MultiPointer.elem;
  3583. LLVMValueRef indices[1] = {index.value};
  3584. v.value = LLVMBuildGEP2(p->builder, lb_type(p->module, elem), rel_ptr.value, indices, 1, "");
  3585. v.type = alloc_type_pointer(elem);
  3586. return lb_addr(v);
  3587. }
  3588. case Type_DynamicArray: {
  3589. lbValue dynamic_array = {};
  3590. dynamic_array = lb_build_expr(p, ie->expr);
  3591. if (deref) {
  3592. dynamic_array = lb_emit_load(p, dynamic_array);
  3593. }
  3594. lbValue elem = lb_dynamic_array_elem(p, dynamic_array);
  3595. lbValue len = lb_dynamic_array_len(p, dynamic_array);
  3596. lbValue index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3597. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3598. lbValue v = lb_emit_ptr_offset(p, elem, index);
  3599. return lb_addr(v);
  3600. }
  3601. case Type_Matrix: {
  3602. lbValue matrix = {};
  3603. matrix = lb_build_addr_ptr(p, ie->expr);
  3604. if (deref) {
  3605. matrix = lb_emit_load(p, matrix);
  3606. }
  3607. lbValue index = lb_build_expr(p, ie->index);
  3608. index = lb_emit_conv(p, index, t_int);
  3609. isize bounds_len = 0;
  3610. lbValue elem = {};
  3611. if (t->Matrix.is_row_major) {
  3612. bounds_len = t->Matrix.row_count;
  3613. elem = lb_emit_matrix_ep(p, matrix, index, lb_const_int(p->module, t_int, 0));
  3614. } else {
  3615. bounds_len = t->Matrix.column_count;
  3616. elem = lb_emit_matrix_ep(p, matrix, lb_const_int(p->module, t_int, 0), index);
  3617. }
  3618. elem = lb_emit_conv(p, elem, alloc_type_pointer(type_of_expr(expr)));
  3619. auto index_tv = type_and_value_of_expr(ie->index);
  3620. if (index_tv.mode != Addressing_Constant) {
  3621. lbValue len = lb_const_int(p->module, t_int, bounds_len);
  3622. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3623. }
  3624. return lb_addr(elem);
  3625. }
  3626. case Type_Basic: { // Basic_string
  3627. lbValue str;
  3628. lbValue elem;
  3629. lbValue len;
  3630. lbValue index;
  3631. str = lb_build_expr(p, ie->expr);
  3632. if (deref) {
  3633. str = lb_emit_load(p, str);
  3634. }
  3635. elem = lb_string_elem(p, str);
  3636. len = lb_string_len(p, str);
  3637. index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3638. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3639. return lb_addr(lb_emit_ptr_offset(p, elem, index));
  3640. }
  3641. }
  3642. return {};
  3643. }
  3644. gb_internal lbAddr lb_build_addr_slice_expr(lbProcedure *p, Ast *expr) {
  3645. ast_node(se, SliceExpr, expr);
  3646. lbValue low = lb_const_int(p->module, t_int, 0);
  3647. lbValue high = {};
  3648. if (se->low != nullptr) {
  3649. low = lb_correct_endianness(p, lb_build_expr(p, se->low));
  3650. }
  3651. if (se->high != nullptr) {
  3652. high = lb_correct_endianness(p, lb_build_expr(p, se->high));
  3653. }
  3654. bool no_indices = se->low == nullptr && se->high == nullptr;
  3655. lbAddr addr = lb_build_addr(p, se->expr);
  3656. lbValue base = lb_addr_load(p, addr);
  3657. Type *type = base_type(base.type);
  3658. if (is_type_pointer(type)) {
  3659. type = base_type(type_deref(type));
  3660. addr = lb_addr(base);
  3661. base = lb_addr_load(p, addr);
  3662. }
  3663. switch (type->kind) {
  3664. case Type_Slice: {
  3665. Type *slice_type = type;
  3666. lbValue len = lb_slice_len(p, base);
  3667. if (high.value == nullptr) high = len;
  3668. if (!no_indices) {
  3669. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3670. }
  3671. lbValue elem = lb_emit_ptr_offset(p, lb_slice_elem(p, base), low);
  3672. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3673. lbAddr slice = lb_add_local_generated(p, slice_type, false);
  3674. lb_fill_slice(p, slice, elem, new_len);
  3675. return slice;
  3676. }
  3677. case Type_RelativePointer:
  3678. GB_PANIC("TODO(bill): Type_RelativePointer should be handled above already on the lb_addr_load");
  3679. break;
  3680. case Type_RelativeMultiPointer:
  3681. GB_PANIC("TODO(bill): Type_RelativeMultiPointer should be handled above already on the lb_addr_load");
  3682. break;
  3683. case Type_DynamicArray: {
  3684. Type *elem_type = type->DynamicArray.elem;
  3685. Type *slice_type = alloc_type_slice(elem_type);
  3686. lbValue len = lb_dynamic_array_len(p, base);
  3687. if (high.value == nullptr) high = len;
  3688. if (!no_indices) {
  3689. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3690. }
  3691. lbValue elem = lb_emit_ptr_offset(p, lb_dynamic_array_elem(p, base), low);
  3692. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3693. lbAddr slice = lb_add_local_generated(p, slice_type, false);
  3694. lb_fill_slice(p, slice, elem, new_len);
  3695. return slice;
  3696. }
  3697. case Type_MultiPointer: {
  3698. lbAddr res = lb_add_local_generated(p, type_of_expr(expr), false);
  3699. if (se->high == nullptr) {
  3700. lbValue offset = base;
  3701. LLVMValueRef indices[1] = {low.value};
  3702. offset.value = LLVMBuildGEP2(p->builder, lb_type(p->module, base_type(offset.type)->MultiPointer.elem), offset.value, indices, 1, "");
  3703. lb_addr_store(p, res, offset);
  3704. } else {
  3705. low = lb_emit_conv(p, low, t_int);
  3706. high = lb_emit_conv(p, high, t_int);
  3707. lb_emit_multi_pointer_slice_bounds_check(p, se->open, low, high);
  3708. LLVMValueRef indices[1] = {low.value};
  3709. LLVMValueRef ptr = LLVMBuildGEP2(p->builder, lb_type(p->module, base_type(base.type)->MultiPointer.elem), base.value, indices, 1, "");
  3710. LLVMValueRef len = LLVMBuildSub(p->builder, high.value, low.value, "");
  3711. LLVMValueRef gep0 = lb_emit_struct_ep(p, res.addr, 0).value;
  3712. LLVMValueRef gep1 = lb_emit_struct_ep(p, res.addr, 1).value;
  3713. LLVMBuildStore(p->builder, ptr, gep0);
  3714. LLVMBuildStore(p->builder, len, gep1);
  3715. }
  3716. return res;
  3717. }
  3718. case Type_Array: {
  3719. Type *slice_type = alloc_type_slice(type->Array.elem);
  3720. lbValue len = lb_const_int(p->module, t_int, type->Array.count);
  3721. if (high.value == nullptr) high = len;
  3722. bool low_const = type_and_value_of_expr(se->low).mode == Addressing_Constant;
  3723. bool high_const = type_and_value_of_expr(se->high).mode == Addressing_Constant;
  3724. if (!low_const || !high_const) {
  3725. if (!no_indices) {
  3726. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3727. }
  3728. }
  3729. lbValue elem = lb_emit_ptr_offset(p, lb_array_elem(p, lb_addr_get_ptr(p, addr)), low);
  3730. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3731. lbAddr slice = lb_add_local_generated(p, slice_type, false);
  3732. lb_fill_slice(p, slice, elem, new_len);
  3733. return slice;
  3734. }
  3735. case Type_Basic: {
  3736. GB_ASSERT_MSG(are_types_identical(type, t_string), "got %s", type_to_string(type));
  3737. lbValue len = lb_string_len(p, base);
  3738. if (high.value == nullptr) high = len;
  3739. if (!no_indices) {
  3740. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3741. }
  3742. lbValue elem = lb_emit_ptr_offset(p, lb_string_elem(p, base), low);
  3743. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3744. lbAddr str = lb_add_local_generated(p, t_string, false);
  3745. lb_fill_string(p, str, elem, new_len);
  3746. return str;
  3747. }
  3748. case Type_Struct:
  3749. if (is_type_soa_struct(type)) {
  3750. lbValue len = lb_soa_struct_len(p, lb_addr_get_ptr(p, addr));
  3751. if (high.value == nullptr) high = len;
  3752. if (!no_indices) {
  3753. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3754. }
  3755. #if 1
  3756. lbAddr dst = lb_add_local_generated(p, type_of_expr(expr), true);
  3757. if (type->Struct.soa_kind == StructSoa_Fixed) {
  3758. i32 field_count = cast(i32)type->Struct.fields.count;
  3759. for (i32 i = 0; i < field_count; i++) {
  3760. lbValue field_dst = lb_emit_struct_ep(p, dst.addr, i);
  3761. lbValue field_src = lb_emit_struct_ep(p, lb_addr_get_ptr(p, addr), i);
  3762. field_src = lb_emit_array_ep(p, field_src, low);
  3763. field_src = lb_emit_conv(p, field_src, type_deref(field_dst.type));
  3764. lb_emit_store(p, field_dst, field_src);
  3765. }
  3766. lbValue len_dst = lb_emit_struct_ep(p, dst.addr, field_count);
  3767. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3768. lb_emit_store(p, len_dst, new_len);
  3769. } else if (type->Struct.soa_kind == StructSoa_Slice) {
  3770. if (no_indices) {
  3771. lb_addr_store(p, dst, base);
  3772. } else {
  3773. i32 field_count = cast(i32)type->Struct.fields.count - 1;
  3774. for (i32 i = 0; i < field_count; i++) {
  3775. lbValue field_dst = lb_emit_struct_ep(p, dst.addr, i);
  3776. lbValue field_src = lb_emit_struct_ev(p, base, i);
  3777. field_src = lb_emit_ptr_offset(p, field_src, low);
  3778. field_src = lb_emit_conv(p, field_src, type_deref(field_dst.type));
  3779. lb_emit_store(p, field_dst, field_src);
  3780. }
  3781. lbValue len_dst = lb_emit_struct_ep(p, dst.addr, field_count);
  3782. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3783. lb_emit_store(p, len_dst, new_len);
  3784. }
  3785. } else if (type->Struct.soa_kind == StructSoa_Dynamic) {
  3786. i32 field_count = cast(i32)type->Struct.fields.count - 3;
  3787. for (i32 i = 0; i < field_count; i++) {
  3788. lbValue field_dst = lb_emit_struct_ep(p, dst.addr, i);
  3789. lbValue field_src = lb_emit_struct_ev(p, base, i);
  3790. field_src = lb_emit_ptr_offset(p, field_src, low);
  3791. field_src = lb_emit_conv(p, field_src, type_deref(field_dst.type));
  3792. lb_emit_store(p, field_dst, field_src);
  3793. }
  3794. lbValue len_dst = lb_emit_struct_ep(p, dst.addr, field_count);
  3795. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3796. lb_emit_store(p, len_dst, new_len);
  3797. }
  3798. return dst;
  3799. #endif
  3800. }
  3801. break;
  3802. }
  3803. GB_PANIC("Unknown slicable type");
  3804. return {};
  3805. }
  3806. gb_internal lbAddr lb_build_addr_compound_lit(lbProcedure *p, Ast *expr) {
  3807. ast_node(cl, CompoundLit, expr);
  3808. Type *type = type_of_expr(expr);
  3809. Type *bt = base_type(type);
  3810. lbAddr v = lb_add_local_generated(p, type, true);
  3811. TEMPORARY_ALLOCATOR_GUARD();
  3812. Type *et = nullptr;
  3813. switch (bt->kind) {
  3814. case Type_Array: et = bt->Array.elem; break;
  3815. case Type_EnumeratedArray: et = bt->EnumeratedArray.elem; break;
  3816. case Type_Slice: et = bt->Slice.elem; break;
  3817. case Type_BitSet: et = bt->BitSet.elem; break;
  3818. case Type_SimdVector: et = bt->SimdVector.elem; break;
  3819. case Type_Matrix: et = bt->Matrix.elem; break;
  3820. }
  3821. String proc_name = {};
  3822. if (p->entity) {
  3823. proc_name = p->entity->token.string;
  3824. }
  3825. TokenPos pos = ast_token(expr).pos;
  3826. switch (bt->kind) {
  3827. default: GB_PANIC("Unknown CompoundLit type: %s", type_to_string(type)); break;
  3828. case Type_BitField: {
  3829. TEMPORARY_ALLOCATOR_GUARD();
  3830. // Type *backing_type = core_type(bt->BitField.backing_type);
  3831. struct FieldData {
  3832. Type *field_type;
  3833. u64 bit_offset;
  3834. u64 bit_size;
  3835. };
  3836. auto values = array_make<lbValue>(temporary_allocator(), 0, cl->elems.count);
  3837. auto fields = array_make<FieldData>(temporary_allocator(), 0, cl->elems.count);
  3838. for (Ast *elem : cl->elems) {
  3839. ast_node(fv, FieldValue, elem);
  3840. String name = fv->field->Ident.token.string;
  3841. Selection sel = lookup_field(bt, name, false);
  3842. GB_ASSERT(sel.is_bit_field);
  3843. GB_ASSERT(!sel.indirect);
  3844. GB_ASSERT(sel.index.count == 1);
  3845. GB_ASSERT(sel.entity != nullptr);
  3846. i64 index = sel.index[0];
  3847. Entity *f = bt->BitField.fields[index];
  3848. GB_ASSERT(f == sel.entity);
  3849. i64 bit_offset = bt->BitField.bit_offsets[index];
  3850. i64 bit_size = bt->BitField.bit_sizes[index];
  3851. GB_ASSERT(bit_size > 0);
  3852. Type *field_type = sel.entity->type;
  3853. lbValue field_expr = lb_build_expr(p, fv->value);
  3854. field_expr = lb_emit_conv(p, field_expr, field_type);
  3855. array_add(&values, field_expr);
  3856. array_add(&fields, FieldData{field_type, cast(u64)bit_offset, cast(u64)bit_size});
  3857. }
  3858. // NOTE(bill): inline insertion sort should be good enough, right?
  3859. for (isize i = 1; i < values.count; i++) {
  3860. for (isize j = i;
  3861. j > 0 && fields[i].bit_offset < fields[j].bit_offset;
  3862. j--) {
  3863. auto vtmp = values[j];
  3864. values[j] = values[j-1];
  3865. values[j-1] = vtmp;
  3866. auto ftmp = fields[j];
  3867. fields[j] = fields[j-1];
  3868. fields[j-1] = ftmp;
  3869. }
  3870. }
  3871. bool any_fields_different_endian = false;
  3872. for (auto const &f : fields) {
  3873. if (is_type_different_to_arch_endianness(f.field_type)) {
  3874. // NOTE(bill): Just be slow for this, to be correct
  3875. any_fields_different_endian = true;
  3876. break;
  3877. }
  3878. }
  3879. if (!any_fields_different_endian &&
  3880. fields.count == bt->BitField.fields.count) {
  3881. // SINGLE INTEGER BACKING ONLY
  3882. Type *backing_type = core_type(bt->BitField.backing_type);
  3883. GB_ASSERT(is_type_integer(backing_type) ||
  3884. (is_type_array(backing_type) && is_type_integer(backing_type->Array.elem)));
  3885. // NOTE(bill): all fields are present
  3886. // this means no masking is necessary since on write, the bits will be overridden
  3887. lbValue dst_byte_ptr = lb_emit_conv(p, v.addr, t_u8_ptr);
  3888. u64 total_bit_size = cast(u64)(8*type_size_of(bt));
  3889. if (is_type_integer(backing_type)) {
  3890. LLVMTypeRef lit = lb_type(p->module, backing_type);
  3891. LLVMValueRef res = LLVMConstInt(lit, 0, false);
  3892. for (isize i = 0; i < fields.count; i++) {
  3893. auto const &f = fields[i];
  3894. LLVMValueRef mask = LLVMConstInt(lit, 1, false);
  3895. mask = LLVMConstShl(mask, LLVMConstInt(lit, f.bit_size, false));
  3896. mask = LLVMConstSub(mask, LLVMConstInt(lit, 1, false));
  3897. LLVMValueRef elem = values[i].value;
  3898. if (lb_sizeof(lit) < lb_sizeof(LLVMTypeOf(elem))) {
  3899. elem = LLVMBuildTrunc(p->builder, elem, lit, "");
  3900. } else {
  3901. elem = LLVMBuildZExt(p->builder, elem, lit, "");
  3902. }
  3903. elem = LLVMBuildAnd(p->builder, elem, mask, "");
  3904. elem = LLVMBuildShl(p->builder, elem, LLVMConstInt(lit, f.bit_offset, false), "");
  3905. res = LLVMBuildOr(p->builder, res, elem, "");
  3906. }
  3907. LLVMBuildStore(p->builder, res, v.addr.value);
  3908. } else if (is_type_array(backing_type)) {
  3909. // ARRAY OF INTEGER BACKING
  3910. i64 array_count = backing_type->Array.count;
  3911. LLVMTypeRef lit = lb_type(p->module, core_type(backing_type->Array.elem));
  3912. gb_unused(array_count);
  3913. gb_unused(lit);
  3914. LLVMValueRef *elems = gb_alloc_array(temporary_allocator(), LLVMValueRef, array_count);
  3915. for (i64 i = 0; i < array_count; i++) {
  3916. elems[i] = LLVMConstInt(lit, 0, false);
  3917. }
  3918. u64 elem_bit_size = cast(u64)(8*type_size_of(backing_type->Array.elem));
  3919. u64 curr_bit_offset = 0;
  3920. for (isize i = 0; i < fields.count; i++) {
  3921. auto const &f = fields[i];
  3922. LLVMValueRef val = values[i].value;
  3923. LLVMTypeRef vt = lb_type(p->module, values[i].type);
  3924. for (u64 bits_to_set = f.bit_size;
  3925. bits_to_set > 0;
  3926. /**/) {
  3927. i64 elem_idx = curr_bit_offset/elem_bit_size;
  3928. u64 elem_bit_offset = curr_bit_offset%elem_bit_size;
  3929. u64 mask_width = gb_min(bits_to_set, elem_bit_size-elem_bit_offset);
  3930. GB_ASSERT(mask_width > 0);
  3931. bits_to_set -= mask_width;
  3932. LLVMValueRef mask = LLVMConstInt(vt, 1, false);
  3933. mask = LLVMConstShl(mask, LLVMConstInt(vt, mask_width, false));
  3934. mask = LLVMConstSub(mask, LLVMConstInt(vt, 1, false));
  3935. LLVMValueRef to_set = LLVMBuildAnd(p->builder, val, mask, "");
  3936. if (elem_bit_offset != 0) {
  3937. to_set = LLVMBuildShl(p->builder, to_set, LLVMConstInt(vt, elem_bit_offset, false), "");
  3938. }
  3939. to_set = LLVMBuildTrunc(p->builder, to_set, lit, "");
  3940. if (LLVMIsNull(elems[elem_idx])) {
  3941. elems[elem_idx] = to_set; // don't even bother doing `0 | to_set`
  3942. } else {
  3943. elems[elem_idx] = LLVMBuildOr(p->builder, elems[elem_idx], to_set, "");
  3944. }
  3945. if (mask_width != 0) {
  3946. val = LLVMBuildLShr(p->builder, val, LLVMConstInt(vt, mask_width, false), "");
  3947. }
  3948. curr_bit_offset += mask_width;
  3949. }
  3950. GB_ASSERT(curr_bit_offset == f.bit_offset + f.bit_size);
  3951. }
  3952. for (i64 i = 0; i < array_count; i++) {
  3953. LLVMValueRef elem_ptr = LLVMBuildStructGEP2(p->builder, lb_type(p->module, backing_type), v.addr.value, cast(unsigned)i, "");
  3954. LLVMBuildStore(p->builder, elems[i], elem_ptr);
  3955. }
  3956. } else {
  3957. // SLOW STORAGE
  3958. for_array(i, fields) {
  3959. auto const &f = fields[i];
  3960. if ((f.bit_offset & 7) == 0) {
  3961. u64 unpacked_bit_size = cast(u64)(8*type_size_of(f.field_type));
  3962. u64 byte_size = (f.bit_size+7)/8;
  3963. if (f.bit_offset + unpacked_bit_size <= total_bit_size) {
  3964. byte_size = unpacked_bit_size/8;
  3965. }
  3966. lbValue dst = lb_emit_ptr_offset(p, dst_byte_ptr, lb_const_int(p->module, t_int, f.bit_offset/8));
  3967. lbValue src = lb_address_from_load_or_generate_local(p, values[i]);
  3968. lb_mem_copy_non_overlapping(p, dst, src, lb_const_int(p->module, t_uintptr, byte_size));
  3969. } else {
  3970. lbAddr dst = lb_addr_bit_field(v.addr, f.field_type, f.bit_offset, f.bit_size);
  3971. lb_addr_store(p, dst, values[i]);
  3972. }
  3973. }
  3974. }
  3975. } else {
  3976. // individual storing
  3977. for_array(i, values) {
  3978. auto const &f = fields[i];
  3979. lbAddr dst = lb_addr_bit_field(v.addr, f.field_type, f.bit_offset, f.bit_size);
  3980. lb_addr_store(p, dst, values[i]);
  3981. }
  3982. }
  3983. return v;
  3984. }
  3985. case Type_Struct: {
  3986. // TODO(bill): "constant" '#raw_union's are not initialized constantly at the moment.
  3987. // NOTE(bill): This is due to the layout of the unions when printed to LLVM-IR
  3988. bool is_raw_union = is_type_raw_union(bt);
  3989. GB_ASSERT(is_type_struct(bt) || is_raw_union);
  3990. TypeStruct *st = &bt->Struct;
  3991. if (cl->elems.count > 0) {
  3992. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  3993. lbValue comp_lit_ptr = lb_addr_get_ptr(p, v);
  3994. for_array(field_index, cl->elems) {
  3995. Ast *elem = cl->elems[field_index];
  3996. lbValue field_expr = {};
  3997. Entity *field = nullptr;
  3998. isize index = field_index;
  3999. if (elem->kind == Ast_FieldValue) {
  4000. ast_node(fv, FieldValue, elem);
  4001. String name = fv->field->Ident.token.string;
  4002. Selection sel = lookup_field(bt, name, false);
  4003. GB_ASSERT(!sel.indirect);
  4004. elem = fv->value;
  4005. if (sel.index.count > 1) {
  4006. if (lb_is_nested_possibly_constant(type, sel, elem)) {
  4007. continue;
  4008. }
  4009. field_expr = lb_build_expr(p, elem);
  4010. field_expr = lb_emit_conv(p, field_expr, sel.entity->type);
  4011. if (sel.is_bit_field) {
  4012. Selection sub_sel = trim_selection(sel);
  4013. lbValue trimmed_dst = lb_emit_deep_field_gep(p, comp_lit_ptr, sub_sel);
  4014. Type *bf = base_type(type_deref(trimmed_dst.type));
  4015. if (is_type_pointer(bf)) {
  4016. trimmed_dst = lb_emit_load(p, trimmed_dst);
  4017. bf = base_type(type_deref(trimmed_dst.type));
  4018. }
  4019. GB_ASSERT(bf->kind == Type_BitField);
  4020. isize idx = sel.index[sel.index.count-1];
  4021. lbAddr dst = lb_addr_bit_field(trimmed_dst, bf->BitField.fields[idx]->type, bf->BitField.bit_offsets[idx], bf->BitField.bit_sizes[idx]);
  4022. lb_addr_store(p, dst, field_expr);
  4023. } else {
  4024. lbValue dst = lb_emit_deep_field_gep(p, comp_lit_ptr, sel);
  4025. lb_emit_store(p, dst, field_expr);
  4026. }
  4027. continue;
  4028. }
  4029. index = sel.index[0];
  4030. } else {
  4031. Selection sel = lookup_field_from_index(bt, st->fields[field_index]->Variable.field_index);
  4032. GB_ASSERT(sel.index.count == 1);
  4033. GB_ASSERT(!sel.indirect);
  4034. index = sel.index[0];
  4035. }
  4036. field = st->fields[index];
  4037. Type *ft = field->type;
  4038. if (!is_raw_union && !is_type_typeid(ft) && lb_is_elem_const(elem, ft)) {
  4039. continue;
  4040. }
  4041. field_expr = lb_build_expr(p, elem);
  4042. lbValue gep = {};
  4043. if (is_raw_union) {
  4044. gep = lb_emit_conv(p, comp_lit_ptr, alloc_type_pointer(ft));
  4045. } else {
  4046. gep = lb_emit_struct_ep(p, comp_lit_ptr, cast(i32)index);
  4047. }
  4048. Type *fet = field_expr.type;
  4049. GB_ASSERT(fet->kind != Type_Tuple);
  4050. // HACK TODO(bill): THIS IS A MASSIVE HACK!!!!
  4051. if (is_type_union(ft) && !are_types_identical(fet, ft) && !is_type_untyped(fet)) {
  4052. GB_ASSERT_MSG(union_variant_index(ft, fet) >= 0, "%s", type_to_string(fet));
  4053. lb_emit_store_union_variant(p, gep, field_expr, fet);
  4054. } else {
  4055. lbValue fv = lb_emit_conv(p, field_expr, ft);
  4056. lb_emit_store(p, gep, fv);
  4057. }
  4058. }
  4059. }
  4060. break;
  4061. }
  4062. case Type_Map: {
  4063. if (cl->elems.count == 0) {
  4064. break;
  4065. }
  4066. GB_ASSERT(!build_context.no_dynamic_literals);
  4067. lbValue err = lb_dynamic_map_reserve(p, v.addr, 2*cl->elems.count, pos);
  4068. gb_unused(err);
  4069. for (Ast *elem : cl->elems) {
  4070. ast_node(fv, FieldValue, elem);
  4071. lbValue key = lb_build_expr(p, fv->field);
  4072. lbValue value = lb_build_expr(p, fv->value);
  4073. lb_internal_dynamic_map_set(p, v.addr, type, key, value, elem);
  4074. }
  4075. break;
  4076. }
  4077. case Type_Array: {
  4078. if (cl->elems.count > 0) {
  4079. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4080. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4081. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4082. lbValue dst_ptr = lb_addr_get_ptr(p, v);
  4083. for_array(i, temp_data) {
  4084. i32 index = cast(i32)(temp_data[i].elem_index);
  4085. temp_data[i].gep = lb_emit_array_epi(p, dst_ptr, index);
  4086. }
  4087. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4088. }
  4089. break;
  4090. }
  4091. case Type_EnumeratedArray: {
  4092. if (cl->elems.count > 0) {
  4093. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4094. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4095. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4096. lbValue dst_ptr = lb_addr_get_ptr(p, v);
  4097. i64 index_offset = exact_value_to_i64(*bt->EnumeratedArray.min_value);
  4098. for_array(i, temp_data) {
  4099. i32 index = cast(i32)(temp_data[i].elem_index - index_offset);
  4100. temp_data[i].gep = lb_emit_array_epi(p, dst_ptr, index);
  4101. }
  4102. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4103. }
  4104. break;
  4105. }
  4106. case Type_Slice: {
  4107. if (cl->elems.count > 0) {
  4108. lbValue slice = lb_const_value(p->module, type, exact_value_compound(expr));
  4109. lbValue data = lb_slice_elem(p, slice);
  4110. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4111. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4112. for_array(i, temp_data) {
  4113. temp_data[i].gep = lb_emit_ptr_offset(p, data, lb_const_int(p->module, t_int, temp_data[i].elem_index));
  4114. }
  4115. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4116. {
  4117. lbValue count = {};
  4118. count.type = t_int;
  4119. unsigned len_index = lb_convert_struct_index(p->module, type, 1);
  4120. if (lb_is_const(slice)) {
  4121. unsigned indices[1] = {len_index};
  4122. count.value = llvm_const_extract_value(p->module, slice.value, indices, gb_count_of(indices));
  4123. } else {
  4124. count.value = LLVMBuildExtractValue(p->builder, slice.value, len_index, "");
  4125. }
  4126. lb_fill_slice(p, v, data, count);
  4127. }
  4128. }
  4129. break;
  4130. }
  4131. case Type_DynamicArray: {
  4132. if (cl->elems.count == 0) {
  4133. break;
  4134. }
  4135. GB_ASSERT(!build_context.no_dynamic_literals);
  4136. Type *et = bt->DynamicArray.elem;
  4137. lbValue size = lb_const_int(p->module, t_int, type_size_of(et));
  4138. lbValue align = lb_const_int(p->module, t_int, type_align_of(et));
  4139. i64 item_count = gb_max(cl->max_count, cl->elems.count);
  4140. {
  4141. auto args = array_make<lbValue>(temporary_allocator(), 5);
  4142. args[0] = lb_emit_conv(p, lb_addr_get_ptr(p, v), t_rawptr);
  4143. args[1] = size;
  4144. args[2] = align;
  4145. args[3] = lb_const_int(p->module, t_int, item_count);
  4146. args[4] = lb_emit_source_code_location_as_global(p, proc_name, pos);
  4147. lb_emit_runtime_call(p, "__dynamic_array_reserve", args);
  4148. }
  4149. lbValue items = lb_generate_local_array(p, et, item_count);
  4150. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4151. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4152. for_array(i, temp_data) {
  4153. temp_data[i].gep = lb_emit_array_epi(p, items, temp_data[i].elem_index);
  4154. }
  4155. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4156. {
  4157. auto args = array_make<lbValue>(temporary_allocator(), 6);
  4158. args[0] = lb_emit_conv(p, v.addr, t_rawptr);
  4159. args[1] = size;
  4160. args[2] = align;
  4161. args[3] = lb_emit_conv(p, items, t_rawptr);
  4162. args[4] = lb_const_int(p->module, t_int, item_count);
  4163. args[5] = lb_emit_source_code_location_as_global(p, proc_name, pos);
  4164. lb_emit_runtime_call(p, "__dynamic_array_append", args);
  4165. }
  4166. break;
  4167. }
  4168. case Type_Basic: {
  4169. GB_ASSERT(is_type_any(bt));
  4170. if (cl->elems.count > 0) {
  4171. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4172. String field_names[2] = {
  4173. str_lit("data"),
  4174. str_lit("id"),
  4175. };
  4176. Type *field_types[2] = {
  4177. t_rawptr,
  4178. t_typeid,
  4179. };
  4180. for_array(field_index, cl->elems) {
  4181. Ast *elem = cl->elems[field_index];
  4182. lbValue field_expr = {};
  4183. isize index = field_index;
  4184. if (elem->kind == Ast_FieldValue) {
  4185. ast_node(fv, FieldValue, elem);
  4186. Selection sel = lookup_field(bt, fv->field->Ident.token.string, false);
  4187. index = sel.index[0];
  4188. elem = fv->value;
  4189. } else {
  4190. TypeAndValue tav = type_and_value_of_expr(elem);
  4191. Selection sel = lookup_field(bt, field_names[field_index], false);
  4192. index = sel.index[0];
  4193. }
  4194. field_expr = lb_build_expr(p, elem);
  4195. GB_ASSERT(field_expr.type->kind != Type_Tuple);
  4196. Type *ft = field_types[index];
  4197. lbValue fv = lb_emit_conv(p, field_expr, ft);
  4198. lbValue gep = lb_emit_struct_ep(p, lb_addr_get_ptr(p, v), cast(i32)index);
  4199. lb_emit_store(p, gep, fv);
  4200. }
  4201. }
  4202. break;
  4203. }
  4204. case Type_BitSet: {
  4205. i64 sz = type_size_of(type);
  4206. if (cl->elems.count > 0 && sz > 0) {
  4207. lbValue lower = lb_const_value(p->module, t_int, exact_value_i64(bt->BitSet.lower));
  4208. Type *backing = bit_set_to_int(type);
  4209. if (is_type_array(backing)) {
  4210. GB_PANIC("TODO: bit_set [N]T");
  4211. Type *base_it = core_array_type(backing);
  4212. i64 bits_per_elem = 8*type_size_of(base_it);
  4213. gb_unused(bits_per_elem);
  4214. lbValue one = lb_const_value(p->module, t_i64, exact_value_i64(1));
  4215. for (Ast *elem : cl->elems) {
  4216. GB_ASSERT(elem->kind != Ast_FieldValue);
  4217. lbValue expr = lb_build_expr(p, elem);
  4218. GB_ASSERT(expr.type->kind != Type_Tuple);
  4219. lbValue e = lb_emit_conv(p, expr, t_i64);
  4220. e = lb_emit_arith(p, Token_Sub, e, lower, t_i64);
  4221. // lbValue idx = lb_emit_arith(p, Token_Div, e, bits_per_elem, t_i64);
  4222. // lbValue val = lb_emit_arith(p, Token_Div, e, bits_per_elem, t_i64);
  4223. }
  4224. } else {
  4225. Type *it = bit_set_to_int(bt);
  4226. lbValue one = lb_const_value(p->module, it, exact_value_i64(1));
  4227. for (Ast *elem : cl->elems) {
  4228. GB_ASSERT(elem->kind != Ast_FieldValue);
  4229. lbValue expr = lb_build_expr(p, elem);
  4230. GB_ASSERT(expr.type->kind != Type_Tuple);
  4231. lbValue e = lb_emit_conv(p, expr, it);
  4232. e = lb_emit_arith(p, Token_Sub, e, lower, it);
  4233. e = lb_emit_arith(p, Token_Shl, one, e, it);
  4234. lbValue old_value = lb_emit_transmute(p, lb_addr_load(p, v), it);
  4235. lbValue new_value = lb_emit_arith(p, Token_Or, old_value, e, it);
  4236. new_value = lb_emit_transmute(p, new_value, type);
  4237. lb_addr_store(p, v, new_value);
  4238. }
  4239. }
  4240. }
  4241. break;
  4242. }
  4243. case Type_Matrix: {
  4244. if (cl->elems.count > 0) {
  4245. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4246. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4247. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4248. lbValue dst_ptr = lb_addr_get_ptr(p, v);
  4249. for_array(i, temp_data) {
  4250. temp_data[i].gep = lb_emit_array_epi(p, dst_ptr, temp_data[i].elem_index);
  4251. }
  4252. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4253. }
  4254. break;
  4255. }
  4256. case Type_SimdVector: {
  4257. if (cl->elems.count > 0) {
  4258. lbValue vector_value = lb_const_value(p->module, type, exact_value_compound(expr));
  4259. defer (lb_addr_store(p, v, vector_value));
  4260. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4261. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4262. // TODO(bill): reduce the need for individual `insertelement` if a `shufflevector`
  4263. // might be a better option
  4264. for (auto const &td : temp_data) {
  4265. if (td.value.value != nullptr) {
  4266. if (td.elem_length > 0) {
  4267. for (i64 k = 0; k < td.elem_length; k++) {
  4268. LLVMValueRef index = lb_const_int(p->module, t_u32, td.elem_index + k).value;
  4269. vector_value.value = LLVMBuildInsertElement(p->builder, vector_value.value, td.value.value, index, "");
  4270. }
  4271. } else {
  4272. LLVMValueRef index = lb_const_int(p->module, t_u32, td.elem_index).value;
  4273. vector_value.value = LLVMBuildInsertElement(p->builder, vector_value.value, td.value.value, index, "");
  4274. }
  4275. }
  4276. }
  4277. }
  4278. break;
  4279. }
  4280. }
  4281. return v;
  4282. }
  4283. gb_internal lbAddr lb_build_addr_internal(lbProcedure *p, Ast *expr) {
  4284. switch (expr->kind) {
  4285. case_ast_node(i, Implicit, expr);
  4286. lbAddr v = {};
  4287. switch (i->kind) {
  4288. case Token_context:
  4289. v = lb_find_or_generate_context_ptr(p);
  4290. break;
  4291. }
  4292. GB_ASSERT(v.addr.value != nullptr);
  4293. return v;
  4294. case_end;
  4295. case_ast_node(i, Ident, expr);
  4296. if (is_blank_ident(expr)) {
  4297. lbAddr val = {};
  4298. return val;
  4299. }
  4300. String name = i->token.string;
  4301. Entity *e = entity_of_node(expr);
  4302. return lb_build_addr_from_entity(p, e, expr);
  4303. case_end;
  4304. case_ast_node(se, SelectorExpr, expr);
  4305. Ast *sel_node = unparen_expr(se->selector);
  4306. if (sel_node->kind == Ast_Ident) {
  4307. String selector = sel_node->Ident.token.string;
  4308. TypeAndValue tav = type_and_value_of_expr(se->expr);
  4309. if (tav.mode == Addressing_Invalid) {
  4310. // NOTE(bill): Imports
  4311. Entity *imp = entity_of_node(se->expr);
  4312. if (imp != nullptr) {
  4313. GB_ASSERT(imp->kind == Entity_ImportName);
  4314. }
  4315. return lb_build_addr(p, unparen_expr(se->selector));
  4316. }
  4317. Type *type = base_type(tav.type);
  4318. if (tav.mode == Addressing_Type) { // Addressing_Type
  4319. Selection sel = lookup_field(tav.type, selector, true);
  4320. if (sel.pseudo_field) {
  4321. GB_ASSERT(sel.entity->kind == Entity_Procedure || sel.entity->kind == Entity_ProcGroup);
  4322. Entity *e = entity_of_node(sel_node);
  4323. GB_ASSERT(e->kind == Entity_Procedure);
  4324. return lb_addr(lb_find_value_from_entity(p->module, e));
  4325. }
  4326. GB_PANIC("Unreachable %.*s", LIT(selector));
  4327. }
  4328. if (se->swizzle_count > 0) {
  4329. Type *array_type = base_type(type_deref(tav.type));
  4330. GB_ASSERT(array_type->kind == Type_Array || array_type->kind == Type_SimdVector);
  4331. u8 swizzle_count = se->swizzle_count;
  4332. u8 swizzle_indices_raw = se->swizzle_indices;
  4333. u8 swizzle_indices[4] = {};
  4334. for (u8 i = 0; i < swizzle_count; i++) {
  4335. u8 index = swizzle_indices_raw>>(i*2) & 3;
  4336. swizzle_indices[i] = index;
  4337. }
  4338. lbValue a = {};
  4339. if (is_type_pointer(tav.type)) {
  4340. a = lb_build_expr(p, se->expr);
  4341. } else {
  4342. lbAddr addr = lb_build_addr(p, se->expr);
  4343. a = lb_addr_get_ptr(p, addr);
  4344. }
  4345. Type *type = type_deref(expr->tav.type);
  4346. GB_ASSERT(is_type_array(type) || is_type_simd_vector(type));
  4347. return lb_addr_swizzle(a, type, swizzle_count, swizzle_indices);
  4348. }
  4349. Selection sel = lookup_field(type, selector, false);
  4350. GB_ASSERT(sel.entity != nullptr);
  4351. if (sel.pseudo_field) {
  4352. GB_ASSERT(sel.entity->kind == Entity_Procedure || sel.entity->kind == Entity_ProcGroup);
  4353. Entity *e = entity_of_node(sel_node);
  4354. GB_ASSERT(e->kind == Entity_Procedure);
  4355. return lb_addr(lb_find_value_from_entity(p->module, e));
  4356. }
  4357. if (sel.is_bit_field) {
  4358. lbAddr addr = lb_build_addr(p, se->expr);
  4359. Selection sub_sel = sel;
  4360. sub_sel.index.count -= 1;
  4361. lbValue ptr = lb_addr_get_ptr(p, addr);
  4362. if (sub_sel.index.count > 0) {
  4363. ptr = lb_emit_deep_field_gep(p, ptr, sub_sel);
  4364. }
  4365. if (is_type_pointer(type_deref(ptr.type))) {
  4366. ptr = lb_emit_load(p, ptr);
  4367. }
  4368. Type *bf_type = type_deref(ptr.type);
  4369. bf_type = base_type(bf_type);
  4370. GB_ASSERT(bf_type->kind == Type_BitField);
  4371. i32 index = sel.index[sel.index.count-1];
  4372. Entity *f = bf_type->BitField.fields[index];
  4373. u8 bit_size = bf_type->BitField.bit_sizes[index];
  4374. i64 bit_offset = bf_type->BitField.bit_offsets[index];
  4375. return lb_addr_bit_field(ptr, f->type, bit_offset, bit_size);
  4376. }
  4377. {
  4378. lbAddr addr = lb_build_addr(p, se->expr);
  4379. if (addr.kind == lbAddr_Map) {
  4380. lbValue v = lb_addr_load(p, addr);
  4381. lbValue a = lb_address_from_load_or_generate_local(p, v);
  4382. a = lb_emit_deep_field_gep(p, a, sel);
  4383. return lb_addr(a);
  4384. } else if (addr.kind == lbAddr_Context) {
  4385. GB_ASSERT(sel.index.count > 0);
  4386. if (addr.ctx.sel.index.count >= 0) {
  4387. sel = selection_combine(addr.ctx.sel, sel);
  4388. }
  4389. addr.ctx.sel = sel;
  4390. addr.kind = lbAddr_Context;
  4391. return addr;
  4392. } else if (addr.kind == lbAddr_SoaVariable) {
  4393. lbValue index = addr.soa.index;
  4394. i32 first_index = sel.index[0];
  4395. Selection sub_sel = sel;
  4396. sub_sel.index.data += 1;
  4397. sub_sel.index.count -= 1;
  4398. lbValue arr = lb_emit_struct_ep(p, addr.addr, first_index);
  4399. Type *t = base_type(type_deref(addr.addr.type));
  4400. GB_ASSERT(is_type_soa_struct(t));
  4401. if (addr.soa.index_expr != nullptr && (!lb_is_const(addr.soa.index) || t->Struct.soa_kind != StructSoa_Fixed)) {
  4402. lbValue len = lb_soa_struct_len(p, addr.addr);
  4403. lb_emit_bounds_check(p, ast_token(addr.soa.index_expr), addr.soa.index, len);
  4404. }
  4405. lbValue item = {};
  4406. if (t->Struct.soa_kind == StructSoa_Fixed) {
  4407. item = lb_emit_array_ep(p, arr, index);
  4408. } else {
  4409. item = lb_emit_ptr_offset(p, lb_emit_load(p, arr), index);
  4410. }
  4411. if (sub_sel.index.count > 0) {
  4412. item = lb_emit_deep_field_gep(p, item, sub_sel);
  4413. }
  4414. // make sure it's ^T and not [^]T
  4415. item.type = alloc_type_multi_pointer_to_pointer(item.type);
  4416. return lb_addr(item);
  4417. } else if (addr.kind == lbAddr_Swizzle) {
  4418. GB_ASSERT(sel.index.count > 0);
  4419. // NOTE(bill): just patch the index in place
  4420. sel.index[0] = addr.swizzle.indices[sel.index[0]];
  4421. } else if (addr.kind == lbAddr_SwizzleLarge) {
  4422. GB_ASSERT(sel.index.count > 0);
  4423. // NOTE(bill): just patch the index in place
  4424. sel.index[0] = addr.swizzle.indices[sel.index[0]];
  4425. }
  4426. Type *atype = type_deref(lb_addr_type(addr));
  4427. if (is_type_soa_struct(atype)) {
  4428. map_set(&p->selector_addr, expr, addr);
  4429. }
  4430. lbValue a = lb_addr_get_ptr(p, addr);
  4431. a = lb_emit_deep_field_gep(p, a, sel);
  4432. return lb_addr(a);
  4433. }
  4434. } else {
  4435. GB_PANIC("Unsupported selector expression");
  4436. }
  4437. case_end;
  4438. case_ast_node(se, SelectorCallExpr, expr);
  4439. lbValue e = lb_build_expr(p, expr);
  4440. return lb_addr(lb_address_from_load_or_generate_local(p, e));
  4441. case_end;
  4442. case_ast_node(ta, TypeAssertion, expr);
  4443. TokenPos pos = ast_token(expr).pos;
  4444. lbValue e = lb_build_expr(p, ta->expr);
  4445. Type *t = type_deref(e.type);
  4446. if (is_type_union(t)) {
  4447. Type *type = type_of_expr(expr);
  4448. lbAddr v = lb_add_local_generated(p, type, false);
  4449. lb_addr_store(p, v, lb_emit_union_cast(p, lb_build_expr(p, ta->expr), type, pos));
  4450. return v;
  4451. } else if (is_type_any(t)) {
  4452. Type *type = type_of_expr(expr);
  4453. return lb_emit_any_cast_addr(p, lb_build_expr(p, ta->expr), type, pos);
  4454. } else {
  4455. GB_PANIC("TODO(bill): type assertion %s", type_to_string(e.type));
  4456. }
  4457. case_end;
  4458. case_ast_node(ue, UnaryExpr, expr);
  4459. switch (ue->op.kind) {
  4460. case Token_And: {
  4461. lbValue ptr = lb_build_expr(p, expr);
  4462. return lb_addr(lb_address_from_load_or_generate_local(p, ptr));
  4463. }
  4464. default:
  4465. GB_PANIC("Invalid unary expression for lb_build_addr");
  4466. }
  4467. case_end;
  4468. case_ast_node(be, BinaryExpr, expr);
  4469. lbValue v = lb_build_expr(p, expr);
  4470. Type *t = v.type;
  4471. if (is_type_pointer(t)) {
  4472. return lb_addr(v);
  4473. }
  4474. return lb_addr(lb_address_from_load_or_generate_local(p, v));
  4475. case_end;
  4476. case_ast_node(ie, IndexExpr, expr);
  4477. return lb_build_addr_index_expr(p, expr);
  4478. case_end;
  4479. case_ast_node(ie, MatrixIndexExpr, expr);
  4480. Type *t = base_type(type_of_expr(ie->expr));
  4481. bool deref = is_type_pointer(t);
  4482. t = base_type(type_deref(t));
  4483. lbValue m = {};
  4484. m = lb_build_addr_ptr(p, ie->expr);
  4485. if (deref) {
  4486. m = lb_emit_load(p, m);
  4487. }
  4488. lbValue row_index = lb_build_expr(p, ie->row_index);
  4489. lbValue column_index = lb_build_expr(p, ie->column_index);
  4490. row_index = lb_emit_conv(p, row_index, t_int);
  4491. column_index = lb_emit_conv(p, column_index, t_int);
  4492. lbValue elem = lb_emit_matrix_ep(p, m, row_index, column_index);
  4493. auto row_index_tv = type_and_value_of_expr(ie->row_index);
  4494. auto column_index_tv = type_and_value_of_expr(ie->column_index);
  4495. if (row_index_tv.mode != Addressing_Constant || column_index_tv.mode != Addressing_Constant) {
  4496. lbValue row_count = lb_const_int(p->module, t_int, t->Matrix.row_count);
  4497. lbValue column_count = lb_const_int(p->module, t_int, t->Matrix.column_count);
  4498. lb_emit_matrix_bounds_check(p, ast_token(ie->row_index), row_index, column_index, row_count, column_count);
  4499. }
  4500. return lb_addr(elem);
  4501. case_end;
  4502. case_ast_node(se, SliceExpr, expr);
  4503. return lb_build_addr_slice_expr(p, expr);
  4504. case_end;
  4505. case_ast_node(de, DerefExpr, expr);
  4506. Type *t = type_of_expr(de->expr);
  4507. if (is_type_relative_pointer(t)) {
  4508. lbAddr addr = lb_build_addr(p, de->expr);
  4509. addr.relative.deref = true;
  4510. return addr;
  4511. } else if (is_type_soa_pointer(t)) {
  4512. lbValue value = lb_build_expr(p, de->expr);
  4513. lbValue ptr = lb_emit_struct_ev(p, value, 0);
  4514. lbValue idx = lb_emit_struct_ev(p, value, 1);
  4515. return lb_addr_soa_variable(ptr, idx, nullptr);
  4516. }
  4517. lbValue addr = lb_build_expr(p, de->expr);
  4518. return lb_addr(addr);
  4519. case_end;
  4520. case_ast_node(ce, CallExpr, expr);
  4521. BuiltinProcId builtin_id = BuiltinProc_Invalid;
  4522. if (ce->proc->tav.mode == Addressing_Builtin) {
  4523. Entity *e = entity_of_node(ce->proc);
  4524. if (e != nullptr) {
  4525. builtin_id = cast(BuiltinProcId)e->Builtin.id;
  4526. } else {
  4527. builtin_id = BuiltinProc_DIRECTIVE;
  4528. }
  4529. }
  4530. auto const &tv = expr->tav;
  4531. if (builtin_id == BuiltinProc_swizzle &&
  4532. is_type_array(tv.type)) {
  4533. // NOTE(bill, 2021-08-09): `swizzle` has some bizarre semantics so it needs to be
  4534. // specialized here for to be addressable
  4535. return lb_build_array_swizzle_addr(p, ce, tv);
  4536. }
  4537. // NOTE(bill): This is make sure you never need to have an 'array_ev'
  4538. lbValue e = lb_build_expr(p, expr);
  4539. #if 1
  4540. return lb_addr(lb_address_from_load_or_generate_local(p, e));
  4541. #else
  4542. lbAddr v = lb_add_local_generated(p, e.type, false);
  4543. lb_addr_store(p, v, e);
  4544. return v;
  4545. #endif
  4546. case_end;
  4547. case_ast_node(cl, CompoundLit, expr);
  4548. return lb_build_addr_compound_lit(p, expr);
  4549. case_end;
  4550. case_ast_node(tc, TypeCast, expr);
  4551. Type *type = type_of_expr(expr);
  4552. lbValue x = lb_build_expr(p, tc->expr);
  4553. lbValue e = {};
  4554. switch (tc->token.kind) {
  4555. case Token_cast:
  4556. e = lb_emit_conv(p, x, type);
  4557. break;
  4558. case Token_transmute:
  4559. e = lb_emit_transmute(p, x, type);
  4560. break;
  4561. default:
  4562. GB_PANIC("Invalid AST TypeCast");
  4563. }
  4564. lbAddr v = lb_add_local_generated(p, type, false);
  4565. lb_addr_store(p, v, e);
  4566. return v;
  4567. case_end;
  4568. case_ast_node(ac, AutoCast, expr);
  4569. return lb_build_addr(p, ac->expr);
  4570. case_end;
  4571. case_ast_node(te, TernaryIfExpr, expr);
  4572. LLVMValueRef incoming_values[2] = {};
  4573. LLVMBasicBlockRef incoming_blocks[2] = {};
  4574. GB_ASSERT(te->y != nullptr);
  4575. lbBlock *then = lb_create_block(p, "if.then");
  4576. lbBlock *done = lb_create_block(p, "if.done"); // NOTE(bill): Append later
  4577. lbBlock *else_ = lb_create_block(p, "if.else");
  4578. lb_build_cond(p, te->cond, then, else_);
  4579. lb_start_block(p, then);
  4580. Type *ptr_type = alloc_type_pointer(default_type(type_of_expr(expr)));
  4581. incoming_values[0] = lb_emit_conv(p, lb_build_addr_ptr(p, te->x), ptr_type).value;
  4582. lb_emit_jump(p, done);
  4583. lb_start_block(p, else_);
  4584. incoming_values[1] = lb_emit_conv(p, lb_build_addr_ptr(p, te->y), ptr_type).value;
  4585. lb_emit_jump(p, done);
  4586. lb_start_block(p, done);
  4587. lbValue res = {};
  4588. res.value = LLVMBuildPhi(p->builder, lb_type(p->module, ptr_type), "");
  4589. res.type = ptr_type;
  4590. GB_ASSERT(p->curr_block->preds.count >= 2);
  4591. incoming_blocks[0] = p->curr_block->preds[0]->block;
  4592. incoming_blocks[1] = p->curr_block->preds[1]->block;
  4593. LLVMAddIncoming(res.value, incoming_values, incoming_blocks, 2);
  4594. return lb_addr(res);
  4595. case_end;
  4596. case_ast_node(oe, OrElseExpr, expr);
  4597. lbValue ptr = lb_address_from_load_or_generate_local(p, lb_build_expr(p, expr));
  4598. return lb_addr(ptr);
  4599. case_end;
  4600. case_ast_node(oe, OrReturnExpr, expr);
  4601. lbValue ptr = lb_address_from_load_or_generate_local(p, lb_build_expr(p, expr));
  4602. return lb_addr(ptr);
  4603. case_end;
  4604. case_ast_node(be, OrBranchExpr, expr);
  4605. lbBlock *block = nullptr;
  4606. if (be->label != nullptr) {
  4607. lbBranchBlocks bb = lb_lookup_branch_blocks(p, be->label);
  4608. switch (be->token.kind) {
  4609. case Token_or_break: block = bb.break_; break;
  4610. case Token_or_continue: block = bb.continue_; break;
  4611. }
  4612. } else {
  4613. for (lbTargetList *t = p->target_list; t != nullptr && block == nullptr; t = t->prev) {
  4614. if (t->is_block) {
  4615. continue;
  4616. }
  4617. switch (be->token.kind) {
  4618. case Token_or_break: block = t->break_; break;
  4619. case Token_or_continue: block = t->continue_; break;
  4620. }
  4621. }
  4622. }
  4623. GB_ASSERT(block != nullptr);
  4624. TypeAndValue tv = expr->tav;
  4625. lbValue lhs = {};
  4626. lbValue rhs = {};
  4627. lb_emit_try_lhs_rhs(p, be->expr, tv, &lhs, &rhs);
  4628. Type *type = default_type(tv.type);
  4629. if (lhs.value) {
  4630. lhs = lb_emit_conv(p, lhs, type);
  4631. } else if (type != nullptr && type != t_invalid) {
  4632. lhs = lb_const_nil(p->module, type);
  4633. }
  4634. lbBlock *then = lb_create_block(p, "or_branch.then");
  4635. lbBlock *else_ = lb_create_block(p, "or_branch.else");
  4636. lb_emit_if(p, lb_emit_try_has_value(p, rhs), then, else_);
  4637. lb_start_block(p, else_);
  4638. lb_emit_defer_stmts(p, lbDeferExit_Branch, block);
  4639. lb_emit_jump(p, block);
  4640. lb_start_block(p, then);
  4641. return lb_addr(lb_address_from_load_or_generate_local(p, lhs));
  4642. case_end;
  4643. }
  4644. TokenPos token_pos = ast_token(expr).pos;
  4645. GB_PANIC("Unexpected address expression\n"
  4646. "\tAst: %.*s @ "
  4647. "%s\n",
  4648. LIT(ast_strings[expr->kind]),
  4649. token_pos_to_string(token_pos));
  4650. return {};
  4651. }