llvm_backend_expr.cpp 173 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427
74278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477
74778477947804781478247834784478547864787478847894790479147924793479447954796479747984799480048014802480348044805480648074808480948104811481248134814481548164817481848194820482148224823482448254826482748284829483048314832483348344835483648374838483948404841484248434844484548464847484848494850485148524853485448554856485748584859486048614862486348644865486648674868486948704871487248734874487548764877487848794880488148824883488448854886488748884889489048914892489348944895489648974898489949004901490249034904490549064907490849094910491149124913491449154916491749184919492049214922492349244925492649274928492949304931493249334934493549364937493849394940494149424943494449454946494749484949495049514952495349544955495649574958495949604961496249634964496549664967496849694970497149724973497449754976497749784979498049814982498349844985498649874988498949904991499249934994499549964997499849995000500150025003500450055006500750085009501050115012501350145015501650175018501950205021502250235024502550265027502850295030503150325033503450355036503750385039504050415042504350445045504650475048504950505051505250535054505550565057505850595060506150625063506450655066506750685069507050715072507350745075507650775078507950805081508250835084508550865087508850895090509150925093509450955096509750985099510051015102510351045105510651075108510951105111511251135114511551165117511851195120512151225123512451255126512751285129513051315132513351345135513651375138513951405141514251435144514551465147514851495150515151525153515451555156515751585159516051615162516351645165516651675168516951705171517251735174517551765177517851795180518151825183518451855186518751885189519051915192519351945195519651975198519952005201520252035204520552065207520852095210521152125213521452155216521752185219522052215222522352245225522652275228522952305231523252335234523552365237523852395240524152425243524452455246524752485249525052515252525352545255525652575258525952605261526252635264526552665267526852695270527152725273527452755276527
75278527952805281528252835284528552865287528852895290529152925293529452955296529752985299530053015302530353045305530653075308530953105311531253135314531553165317531853195320532153225323532453255326532753285329533053315332533353345335533653375338533953405341534253435344534553465347534853495350535153525353535453555356535753585359536053615362536353645365536653675368536953705371537253735374537553765377537853795380538153825383538453855386538753885389539053915392539353945395539653975398539954005401540254035404540554065407540854095410541154125413541454155416541754185419542054215422542354245425542654275428542954305431543254335434543554365437543854395440544154425443544454455446544754485449545054515452545354545455545654575458545954605461546254635464546554665467546854695470547154725473547454755476547754785479548054815482548354845485548654875488548954905491549254935494549554965497549854995500550155025503550455055506550755085509551055115512551355145515551655175518551955205521552255235524552555265527
  // Forward declaration; the definition is not visible in this part of the file.
  // lb_emit_unary_arith (below) calls it with Token_Sub and component_wise=true to negate a matrix as `0 - x`.
  1. gb_internal lbValue lb_emit_arith_matrix(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type, bool component_wise);
  2. gb_internal lbValue lb_emit_logical_binary_expr(lbProcedure *p, TokenKind op, Ast *left, Ast *right, Type *final_type) {
  3. lbModule *m = p->module;
  4. lbBlock *rhs = lb_create_block(p, "logical.cmp.rhs");
  5. lbBlock *done = lb_create_block(p, "logical.cmp.done");
  6. lbValue short_circuit = {};
  7. if (op == Token_CmpAnd) {
  8. lb_build_cond(p, left, rhs, done);
  9. short_circuit = lb_const_bool(m, t_llvm_bool, false);
  10. } else if (op == Token_CmpOr) {
  11. lb_build_cond(p, left, done, rhs);
  12. short_circuit = lb_const_bool(m, t_llvm_bool, true);
  13. }
  14. if (rhs->preds.count == 0) {
  15. lb_start_block(p, done);
  16. return short_circuit;
  17. }
  18. if (done->preds.count == 0) {
  19. lb_start_block(p, rhs);
  20. if (lb_is_expr_untyped_const(right)) {
  21. return lb_expr_untyped_const_to_typed(m, right, default_type(final_type));
  22. }
  23. return lb_build_expr(p, right);
  24. }
  25. Array<LLVMValueRef> incoming_values = {};
  26. Array<LLVMBasicBlockRef> incoming_blocks = {};
  27. array_init(&incoming_values, heap_allocator(), done->preds.count+1);
  28. array_init(&incoming_blocks, heap_allocator(), done->preds.count+1);
  29. for_array(i, done->preds) {
  30. incoming_values[i] = short_circuit.value;
  31. incoming_blocks[i] = done->preds[i]->block;
  32. }
  33. lb_start_block(p, rhs);
  34. lbValue edge = {};
  35. if (lb_is_expr_untyped_const(right)) {
  36. edge = lb_expr_untyped_const_to_typed(m, right, t_llvm_bool);
  37. } else {
  38. edge = lb_emit_conv(p, lb_build_expr(p, right), t_llvm_bool);
  39. }
  40. GB_ASSERT(edge.type == t_llvm_bool);
  41. incoming_values[done->preds.count] = edge.value;
  42. incoming_blocks[done->preds.count] = p->curr_block->block;
  43. lb_emit_jump(p, done);
  44. lb_start_block(p, done);
  45. LLVMTypeRef dst_type = lb_type(m, t_llvm_bool);
  46. LLVMValueRef phi = nullptr;
  47. GB_ASSERT(incoming_values.count == incoming_blocks.count);
  48. GB_ASSERT(incoming_values.count > 0);
  49. LLVMTypeRef phi_type = nullptr;
  50. for (LLVMValueRef incoming_value : incoming_values) {
  51. if (!LLVMIsConstant(incoming_value)) {
  52. phi_type = LLVMTypeOf(incoming_value);
  53. break;
  54. }
  55. }
  56. lbValue res = {};
  57. if (phi_type == nullptr) {
  58. phi = LLVMBuildPhi(p->builder, dst_type, "");
  59. LLVMAddIncoming(phi, incoming_values.data, incoming_blocks.data, cast(unsigned)incoming_values.count);
  60. res.value = phi;
  61. res.type = t_llvm_bool;
  62. } else {
  63. for_array(i, incoming_values) {
  64. LLVMValueRef incoming_value = incoming_values[i];
  65. LLVMTypeRef incoming_type = LLVMTypeOf(incoming_value);
  66. if (phi_type != incoming_type) {
  67. GB_ASSERT_MSG(LLVMIsConstant(incoming_value), "%s vs %s", LLVMPrintTypeToString(phi_type), LLVMPrintTypeToString(incoming_type));
  68. bool ok = !!LLVMConstIntGetZExtValue(incoming_value);
  69. incoming_values[i] = LLVMConstInt(phi_type, ok, false);
  70. }
  71. }
  72. // NOTE(bill): this now only uses i1 for the logic to prevent issues with corrupted booleans which are not of value 0 or 1 (e.g. 2)
  73. // Doing this may produce slightly worse code as a result but it will be correct behaviour
  74. phi = LLVMBuildPhi(p->builder, phi_type, "");
  75. LLVMAddIncoming(phi, incoming_values.data, incoming_blocks.data, cast(unsigned)incoming_values.count);
  76. res.value = phi;
  77. res.type = t_llvm_bool;
  78. }
  79. return lb_emit_conv(p, res, default_type(final_type));
  80. }
  81. gb_internal lbValue lb_emit_unary_arith(lbProcedure *p, TokenKind op, lbValue x, Type *type) {
  82. switch (op) {
  83. case Token_Add:
  84. return x;
  85. case Token_Not: // Boolean not
  86. case Token_Xor: // Bitwise not
  87. case Token_Sub: // Number negation
  88. break;
  89. case Token_Pointer:
  90. GB_PANIC("This should be handled elsewhere");
  91. break;
  92. }
  93. if (is_type_array_like(x.type)) {
  94. // IMPORTANT TODO(bill): This is very wasteful with regards to stack memory
  95. Type *tl = base_type(x.type);
  96. lbValue val = lb_address_from_load_or_generate_local(p, x);
  97. GB_ASSERT(is_type_array_like(type));
  98. Type *elem_type = base_array_type(type);
  99. // NOTE(bill): Doesn't need to be zero because it will be initialized in the loops
  100. lbAddr res_addr = lb_add_local(p, type, nullptr, false, true);
  101. lbValue res = lb_addr_get_ptr(p, res_addr);
  102. bool inline_array_arith = lb_can_try_to_inline_array_arith(type);
  103. i32 count = cast(i32)get_array_type_count(tl);
  104. LLVMTypeRef vector_type = nullptr;
  105. if (op != Token_Not && lb_try_vector_cast(p->module, val, &vector_type)) {
  106. LLVMValueRef vp = LLVMBuildPointerCast(p->builder, val.value, LLVMPointerType(vector_type, 0), "");
  107. LLVMValueRef v = OdinLLVMBuildLoad(p, vector_type, vp);
  108. LLVMValueRef opv = nullptr;
  109. switch (op) {
  110. case Token_Xor:
  111. opv = LLVMBuildNot(p->builder, v, "");
  112. if (is_type_bit_set(elem_type)) {
  113. ExactValue ev_mask = exact_bit_set_all_set_mask(elem_type);
  114. lbValue mask = lb_const_value(p->module, elem_type, ev_mask);
  115. opv = LLVMBuildAnd(p->builder, opv, mask.value, "");
  116. }
  117. break;
  118. case Token_Sub:
  119. if (is_type_float(elem_type)) {
  120. opv = LLVMBuildFNeg(p->builder, v, "");
  121. } else {
  122. opv = LLVMBuildNeg(p->builder, v, "");
  123. }
  124. break;
  125. }
  126. if (opv != nullptr) {
  127. LLVMSetAlignment(res.value, cast(unsigned)lb_alignof(vector_type));
  128. LLVMValueRef res_ptr = LLVMBuildPointerCast(p->builder, res.value, LLVMPointerType(vector_type, 0), "");
  129. LLVMBuildStore(p->builder, opv, res_ptr);
  130. return lb_emit_conv(p, lb_emit_load(p, res), type);
  131. }
  132. }
  133. if (inline_array_arith) {
  134. // inline
  135. for (i32 i = 0; i < count; i++) {
  136. lbValue e = lb_emit_load(p, lb_emit_array_epi(p, val, i));
  137. lbValue z = lb_emit_unary_arith(p, op, e, elem_type);
  138. lb_emit_store(p, lb_emit_array_epi(p, res, i), z);
  139. }
  140. } else {
  141. auto loop_data = lb_loop_start(p, count, t_i32);
  142. lbValue e = lb_emit_load(p, lb_emit_array_ep(p, val, loop_data.idx));
  143. lbValue z = lb_emit_unary_arith(p, op, e, elem_type);
  144. lb_emit_store(p, lb_emit_array_ep(p, res, loop_data.idx), z);
  145. lb_loop_end(p, loop_data);
  146. }
  147. return lb_emit_load(p, res);
  148. }
  149. if (op == Token_Xor) {
  150. lbValue cmp = {};
  151. cmp.type = x.type;
  152. if (is_type_bit_set(x.type)) {
  153. ExactValue ev_mask = exact_bit_set_all_set_mask(x.type);
  154. lbValue mask = lb_const_value(p->module, x.type, ev_mask);
  155. cmp.value = LLVMBuildXor(p->builder, x.value, mask.value, "");
  156. } else {
  157. cmp.value = LLVMBuildNot(p->builder, x.value, "");
  158. }
  159. return lb_emit_conv(p, cmp, type);
  160. }
  161. if (op == Token_Not) {
  162. lbValue cmp = {};
  163. LLVMValueRef zero = LLVMConstInt(lb_type(p->module, x.type), 0, false);
  164. cmp.value = LLVMBuildICmp(p->builder, LLVMIntEQ, x.value, zero, "");
  165. cmp.type = t_llvm_bool;
  166. return lb_emit_conv(p, cmp, type);
  167. }
  168. if (op == Token_Sub && is_type_integer(type) && is_type_different_to_arch_endianness(type)) {
  169. Type *platform_type = integer_endian_type_to_platform_type(type);
  170. lbValue v = lb_emit_byte_swap(p, x, platform_type);
  171. lbValue res = {};
  172. res.value = LLVMBuildNeg(p->builder, v.value, "");
  173. res.type = platform_type;
  174. return lb_emit_byte_swap(p, res, type);
  175. }
  176. if (op == Token_Sub && is_type_float(type) && is_type_different_to_arch_endianness(type)) {
  177. Type *platform_type = integer_endian_type_to_platform_type(type);
  178. lbValue v = lb_emit_byte_swap(p, x, platform_type);
  179. lbValue res = {};
  180. res.value = LLVMBuildFNeg(p->builder, v.value, "");
  181. res.type = platform_type;
  182. return lb_emit_byte_swap(p, res, type);
  183. }
  184. lbValue res = {};
  185. switch (op) {
  186. case Token_Not: // Boolean not
  187. case Token_Xor: // Bitwise not
  188. res.value = LLVMBuildNot(p->builder, x.value, "");
  189. res.type = x.type;
  190. return res;
  191. case Token_Sub: // Number negation
  192. if (is_type_integer(x.type)) {
  193. res.value = LLVMBuildNeg(p->builder, x.value, "");
  194. } else if (is_type_float(x.type)) {
  195. res.value = LLVMBuildFNeg(p->builder, x.value, "");
  196. } else if (is_type_complex(x.type)) {
  197. LLVMValueRef v0 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 0, ""), "");
  198. LLVMValueRef v1 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 1, ""), "");
  199. lbAddr addr = lb_add_local_generated(p, x.type, false);
  200. LLVMTypeRef type = llvm_addr_type(p->module, addr.addr);
  201. LLVMBuildStore(p->builder, v0, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 0, ""));
  202. LLVMBuildStore(p->builder, v1, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 1, ""));
  203. return lb_addr_load(p, addr);
  204. } else if (is_type_quaternion(x.type)) {
  205. LLVMValueRef v0 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 0, ""), "");
  206. LLVMValueRef v1 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 1, ""), "");
  207. LLVMValueRef v2 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 2, ""), "");
  208. LLVMValueRef v3 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 3, ""), "");
  209. lbAddr addr = lb_add_local_generated(p, x.type, false);
  210. LLVMTypeRef type = llvm_addr_type(p->module, addr.addr);
  211. LLVMBuildStore(p->builder, v0, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 0, ""));
  212. LLVMBuildStore(p->builder, v1, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 1, ""));
  213. LLVMBuildStore(p->builder, v2, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 2, ""));
  214. LLVMBuildStore(p->builder, v3, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 3, ""));
  215. return lb_addr_load(p, addr);
  216. } else if (is_type_simd_vector(x.type)) {
  217. Type *elem = base_array_type(x.type);
  218. if (is_type_float(elem)) {
  219. res.value = LLVMBuildFNeg(p->builder, x.value, "");
  220. } else {
  221. res.value = LLVMBuildNeg(p->builder, x.value, "");
  222. }
  223. } else if (is_type_matrix(x.type)) {
  224. lbValue zero = {};
  225. zero.value = LLVMConstNull(lb_type(p->module, type));
  226. zero.type = type;
  227. return lb_emit_arith_matrix(p, Token_Sub, zero, x, type, true);
  228. } else {
  229. GB_PANIC("Unhandled type %s", type_to_string(x.type));
  230. }
  231. res.type = x.type;
  232. return res;
  233. }
  234. return res;
  235. }
  236. gb_internal bool lb_try_direct_vector_arith(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type, lbValue *res_) {
  237. GB_ASSERT(is_type_array_like(type));
  238. Type *elem_type = base_array_type(type);
  239. // NOTE(bill): Shift operations cannot be easily dealt with due to Odin's semantics
  240. if (op == Token_Shl || op == Token_Shr) {
  241. return false;
  242. }
  243. if (!LLVMIsALoadInst(lhs.value) || !LLVMIsALoadInst(rhs.value)) {
  244. return false;
  245. }
  246. lbValue lhs_ptr = {};
  247. lbValue rhs_ptr = {};
  248. lhs_ptr.value = LLVMGetOperand(lhs.value, 0);
  249. lhs_ptr.type = alloc_type_pointer(lhs.type);
  250. rhs_ptr.value = LLVMGetOperand(rhs.value, 0);
  251. rhs_ptr.type = alloc_type_pointer(rhs.type);
  252. LLVMTypeRef vector_type0 = nullptr;
  253. LLVMTypeRef vector_type1 = nullptr;
  254. if (lb_try_vector_cast(p->module, lhs_ptr, &vector_type0) &&
  255. lb_try_vector_cast(p->module, rhs_ptr, &vector_type1)) {
  256. GB_ASSERT(vector_type0 == vector_type1);
  257. LLVMTypeRef vector_type = vector_type0;
  258. Type *integral_type = base_type(elem_type);
  259. if (is_type_simd_vector(integral_type)) {
  260. integral_type = core_array_type(integral_type);
  261. }
  262. if (is_type_bit_set(integral_type)) {
  263. switch (op) {
  264. case Token_Add: op = Token_Or; break;
  265. case Token_Sub: op = Token_AndNot; break;
  266. }
  267. Type *u = bit_set_to_int(type);
  268. if (is_type_array(u)) {
  269. return false;
  270. }
  271. }
  272. LLVMValueRef lhs_vp = LLVMBuildPointerCast(p->builder, lhs_ptr.value, LLVMPointerType(vector_type, 0), "");
  273. LLVMValueRef rhs_vp = LLVMBuildPointerCast(p->builder, rhs_ptr.value, LLVMPointerType(vector_type, 0), "");
  274. LLVMValueRef x = OdinLLVMBuildLoad(p, vector_type, lhs_vp);
  275. LLVMValueRef y = OdinLLVMBuildLoad(p, vector_type, rhs_vp);
  276. LLVMValueRef z = nullptr;
  277. if (is_type_float(integral_type)) {
  278. switch (op) {
  279. case Token_Add:
  280. z = LLVMBuildFAdd(p->builder, x, y, "");
  281. break;
  282. case Token_Sub:
  283. z = LLVMBuildFSub(p->builder, x, y, "");
  284. break;
  285. case Token_Mul:
  286. z = LLVMBuildFMul(p->builder, x, y, "");
  287. break;
  288. case Token_Quo:
  289. z = LLVMBuildFDiv(p->builder, x, y, "");
  290. break;
  291. case Token_Mod:
  292. z = LLVMBuildFRem(p->builder, x, y, "");
  293. break;
  294. default:
  295. GB_PANIC("Unsupported vector operation %.*s", LIT(token_strings[op]));
  296. break;
  297. }
  298. } else {
  299. switch (op) {
  300. case Token_Add:
  301. z = LLVMBuildAdd(p->builder, x, y, "");
  302. break;
  303. case Token_Sub:
  304. z = LLVMBuildSub(p->builder, x, y, "");
  305. break;
  306. case Token_Mul:
  307. z = LLVMBuildMul(p->builder, x, y, "");
  308. break;
  309. case Token_Quo:
  310. if (is_type_unsigned(integral_type)) {
  311. z = LLVMBuildUDiv(p->builder, x, y, "");
  312. } else {
  313. z = LLVMBuildSDiv(p->builder, x, y, "");
  314. }
  315. break;
  316. case Token_Mod:
  317. if (is_type_unsigned(integral_type)) {
  318. z = LLVMBuildURem(p->builder, x, y, "");
  319. } else {
  320. z = LLVMBuildSRem(p->builder, x, y, "");
  321. }
  322. break;
  323. case Token_ModMod:
  324. if (is_type_unsigned(integral_type)) {
  325. z = LLVMBuildURem(p->builder, x, y, "");
  326. } else {
  327. LLVMValueRef a = LLVMBuildSRem(p->builder, x, y, "");
  328. LLVMValueRef b = LLVMBuildAdd(p->builder, a, y, "");
  329. z = LLVMBuildSRem(p->builder, b, y, "");
  330. }
  331. break;
  332. case Token_And:
  333. z = LLVMBuildAnd(p->builder, x, y, "");
  334. break;
  335. case Token_AndNot:
  336. z = LLVMBuildAnd(p->builder, x, LLVMBuildNot(p->builder, y, ""), "");
  337. break;
  338. case Token_Or:
  339. z = LLVMBuildOr(p->builder, x, y, "");
  340. break;
  341. case Token_Xor:
  342. z = LLVMBuildXor(p->builder, x, y, "");
  343. break;
  344. default:
  345. GB_PANIC("Unsupported vector operation");
  346. break;
  347. }
  348. }
  349. if (z != nullptr) {
  350. lbAddr res = lb_add_local_generated_temp(p, type, lb_alignof(vector_type));
  351. LLVMValueRef vp = LLVMBuildPointerCast(p->builder, res.addr.value, LLVMPointerType(vector_type, 0), "");
  352. LLVMBuildStore(p->builder, z, vp);
  353. lbValue v = lb_addr_load(p, res);
  354. if (res_) *res_ = v;
  355. return true;
  356. }
  357. }
  358. return false;
  359. }
  360. gb_internal lbValue lb_emit_arith_array(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type) {
  361. GB_ASSERT(is_type_array_like(lhs.type) || is_type_array_like(rhs.type));
  362. lhs = lb_emit_conv(p, lhs, type);
  363. rhs = lb_emit_conv(p, rhs, type);
  364. GB_ASSERT(is_type_array_like(type));
  365. Type *elem_type = base_array_type(type);
  366. i64 count = get_array_type_count(type);
  367. unsigned n = cast(unsigned)count;
  368. // NOTE(bill, 2021-06-12): Try to do a direct operation as a vector, if possible
  369. lbValue direct_vector_res = {};
  370. if (lb_try_direct_vector_arith(p, op, lhs, rhs, type, &direct_vector_res)) {
  371. return direct_vector_res;
  372. }
  373. bool inline_array_arith = lb_can_try_to_inline_array_arith(type);
  374. if (inline_array_arith) {
  375. auto dst_ptrs = slice_make<lbValue>(temporary_allocator(), n);
  376. auto a_loads = slice_make<lbValue>(temporary_allocator(), n);
  377. auto b_loads = slice_make<lbValue>(temporary_allocator(), n);
  378. auto c_ops = slice_make<lbValue>(temporary_allocator(), n);
  379. for (unsigned i = 0; i < n; i++) {
  380. a_loads[i].value = LLVMBuildExtractValue(p->builder, lhs.value, i, "");
  381. a_loads[i].type = elem_type;
  382. }
  383. for (unsigned i = 0; i < n; i++) {
  384. b_loads[i].value = LLVMBuildExtractValue(p->builder, rhs.value, i, "");
  385. b_loads[i].type = elem_type;
  386. }
  387. for (unsigned i = 0; i < n; i++) {
  388. c_ops[i] = lb_emit_arith(p, op, a_loads[i], b_loads[i], elem_type);
  389. }
  390. lbAddr res = lb_add_local_generated(p, type, false);
  391. for (unsigned i = 0; i < n; i++) {
  392. dst_ptrs[i] = lb_emit_array_epi(p, res.addr, i);
  393. }
  394. for (unsigned i = 0; i < n; i++) {
  395. lb_emit_store(p, dst_ptrs[i], c_ops[i]);
  396. }
  397. return lb_addr_load(p, res);
  398. } else {
  399. lbValue x = lb_address_from_load_or_generate_local(p, lhs);
  400. lbValue y = lb_address_from_load_or_generate_local(p, rhs);
  401. lbAddr res = lb_add_local_generated(p, type, false);
  402. auto loop_data = lb_loop_start(p, cast(isize)count, t_i32);
  403. lbValue a_ptr = lb_emit_array_ep(p, x, loop_data.idx);
  404. lbValue b_ptr = lb_emit_array_ep(p, y, loop_data.idx);
  405. lbValue dst_ptr = lb_emit_array_ep(p, res.addr, loop_data.idx);
  406. lbValue a = lb_emit_load(p, a_ptr);
  407. lbValue b = lb_emit_load(p, b_ptr);
  408. lbValue c = lb_emit_arith(p, op, a, b, elem_type);
  409. lb_emit_store(p, dst_ptr, c);
  410. lb_loop_end(p, loop_data);
  411. return lb_addr_load(p, res);
  412. }
  413. }
  414. gb_internal bool lb_is_matrix_simdable(Type *t) {
  415. Type *mt = base_type(t);
  416. GB_ASSERT(mt->kind == Type_Matrix);
  417. Type *elem = core_type(mt->Matrix.elem);
  418. if (is_type_complex(elem)) {
  419. return false;
  420. }
  421. if (is_type_different_to_arch_endianness(elem)) {
  422. return false;
  423. }
  424. switch (build_context.metrics.arch) {
  425. default:
  426. return false;
  427. case TargetArch_amd64:
  428. case TargetArch_arm64:
  429. break;
  430. }
  431. if (type_align_of(t) < 16) {
  432. // it's not aligned well enough to use the vector instructions
  433. return false;
  434. }
  435. if ((mt->Matrix.row_count & 1) ^ (mt->Matrix.column_count & 1)) {
  436. return false;
  437. }
  438. if (mt->Matrix.is_row_major) {
  439. // TODO(bill): make #row_major matrices work with SIMD
  440. return false;
  441. }
  442. if (elem->kind == Type_Basic) {
  443. switch (elem->Basic.kind) {
  444. case Basic_f16:
  445. case Basic_f16le:
  446. case Basic_f16be:
  447. switch (build_context.metrics.arch) {
  448. case TargetArch_amd64:
  449. return false;
  450. case TargetArch_arm64:
  451. // TODO(bill): determine when this is fine
  452. return true;
  453. case TargetArch_i386:
  454. case TargetArch_wasm32:
  455. case TargetArch_wasm64p32:
  456. return false;
  457. }
  458. }
  459. }
  460. return true;
  461. }
  462. gb_internal LLVMValueRef lb_matrix_to_vector(lbProcedure *p, lbValue matrix) {
  463. Type *mt = base_type(matrix.type);
  464. GB_ASSERT(mt->kind == Type_Matrix);
  465. LLVMTypeRef elem_type = lb_type(p->module, mt->Matrix.elem);
  466. unsigned total_count = cast(unsigned)matrix_type_total_internal_elems(mt);
  467. LLVMTypeRef total_matrix_type = LLVMVectorType(elem_type, total_count);
  468. #if 1
  469. LLVMValueRef ptr = lb_address_from_load_or_generate_local(p, matrix).value;
  470. LLVMValueRef matrix_vector_ptr = LLVMBuildPointerCast(p->builder, ptr, LLVMPointerType(total_matrix_type, 0), "");
  471. LLVMValueRef matrix_vector = OdinLLVMBuildLoadAligned(p, total_matrix_type, matrix_vector_ptr, type_align_of(mt));
  472. return matrix_vector;
  473. #else
  474. LLVMValueRef matrix_vector = LLVMBuildBitCast(p->builder, matrix.value, total_matrix_type, "");
  475. return matrix_vector;
  476. #endif
  477. }
  478. gb_internal LLVMValueRef lb_matrix_trimmed_vector_mask(lbProcedure *p, Type *mt) {
  479. mt = base_type(mt);
  480. GB_ASSERT(mt->kind == Type_Matrix);
  481. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  482. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  483. unsigned column_count = cast(unsigned)mt->Matrix.column_count;
  484. unsigned mask_elems_index = 0;
  485. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), row_count*column_count);
  486. for (unsigned j = 0; j < column_count; j++) {
  487. for (unsigned i = 0; i < row_count; i++) {
  488. unsigned offset = stride*j + i;
  489. mask_elems[mask_elems_index++] = lb_const_int(p->module, t_u32, offset).value;
  490. }
  491. }
  492. LLVMValueRef mask = LLVMConstVector(mask_elems.data, cast(unsigned)mask_elems.count);
  493. return mask;
  494. }
  495. gb_internal LLVMValueRef lb_matrix_to_trimmed_vector(lbProcedure *p, lbValue m) {
  496. LLVMValueRef vector = lb_matrix_to_vector(p, m);
  497. Type *mt = base_type(m.type);
  498. GB_ASSERT(mt->kind == Type_Matrix);
  499. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  500. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  501. if (stride == row_count) {
  502. return vector;
  503. }
  504. LLVMValueRef mask = lb_matrix_trimmed_vector_mask(p, mt);
  505. LLVMValueRef trimmed_vector = llvm_basic_shuffle(p, vector, mask);
  506. return trimmed_vector;
  507. }
  508. gb_internal lbValue lb_emit_matrix_tranpose(lbProcedure *p, lbValue m, Type *type) {
  509. if (is_type_array(m.type)) {
  510. i32 rank = type_math_rank(m.type);
  511. if (rank == 2) {
  512. lbAddr addr = lb_add_local_generated(p, type, false);
  513. lbValue dst = addr.addr;
  514. lbValue src = m;
  515. i32 n = cast(i32)get_array_type_count(m.type);
  516. i32 m = cast(i32)get_array_type_count(type);
  517. // m.type == [n][m]T
  518. // type == [m][n]T
  519. for (i32 j = 0; j < m; j++) {
  520. lbValue dst_col = lb_emit_struct_ep(p, dst, j);
  521. for (i32 i = 0; i < n; i++) {
  522. lbValue dst_row = lb_emit_struct_ep(p, dst_col, i);
  523. lbValue src_col = lb_emit_struct_ev(p, src, i);
  524. lbValue src_row = lb_emit_struct_ev(p, src_col, j);
  525. lb_emit_store(p, dst_row, src_row);
  526. }
  527. }
  528. return lb_addr_load(p, addr);
  529. }
  530. // no-op
  531. m.type = type;
  532. return m;
  533. }
  534. Type *mt = base_type(m.type);
  535. GB_ASSERT(mt->kind == Type_Matrix);
  536. if (lb_is_matrix_simdable(mt)) {
  537. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  538. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  539. unsigned column_count = cast(unsigned)mt->Matrix.column_count;
  540. auto rows = slice_make<LLVMValueRef>(permanent_allocator(), row_count);
  541. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  542. LLVMValueRef vector = lb_matrix_to_vector(p, m);
  543. for (unsigned i = 0; i < row_count; i++) {
  544. for (unsigned j = 0; j < column_count; j++) {
  545. unsigned offset = stride*j + i;
  546. mask_elems[j] = lb_const_int(p->module, t_u32, offset).value;
  547. }
  548. // transpose mask
  549. LLVMValueRef mask = LLVMConstVector(mask_elems.data, column_count);
  550. LLVMValueRef row = llvm_basic_shuffle(p, vector, mask);
  551. rows[i] = row;
  552. }
  553. lbAddr res = lb_add_local_generated(p, type, true);
  554. for_array(i, rows) {
  555. LLVMValueRef row = rows[i];
  556. lbValue dst_row_ptr = lb_emit_matrix_epi(p, res.addr, 0, i);
  557. LLVMValueRef ptr = dst_row_ptr.value;
  558. ptr = LLVMBuildPointerCast(p->builder, ptr, LLVMPointerType(LLVMTypeOf(row), 0), "");
  559. LLVMBuildStore(p->builder, row, ptr);
  560. }
  561. return lb_addr_load(p, res);
  562. }
  563. lbAddr res = lb_add_local_generated(p, type, true);
  564. i64 row_count = mt->Matrix.row_count;
  565. i64 column_count = mt->Matrix.column_count;
  566. for (i64 j = 0; j < column_count; j++) {
  567. for (i64 i = 0; i < row_count; i++) {
  568. lbValue src = lb_emit_matrix_ev(p, m, i, j);
  569. lbValue dst = lb_emit_matrix_epi(p, res.addr, j, i);
  570. lb_emit_store(p, dst, src);
  571. }
  572. }
  573. return lb_addr_load(p, res);
  574. }
  575. gb_internal lbValue lb_matrix_cast_vector_to_type(lbProcedure *p, LLVMValueRef vector, Type *type) {
  576. lbAddr res = lb_add_local_generated(p, type, true);
  577. LLVMValueRef res_ptr = res.addr.value;
  578. unsigned alignment = cast(unsigned)gb_max(type_align_of(type), lb_alignof(LLVMTypeOf(vector)));
  579. LLVMSetAlignment(res_ptr, alignment);
  580. res_ptr = LLVMBuildPointerCast(p->builder, res_ptr, LLVMPointerType(LLVMTypeOf(vector), 0), "");
  581. LLVMBuildStore(p->builder, vector, res_ptr);
  582. return lb_addr_load(p, res);
  583. }
  584. gb_internal lbValue lb_emit_matrix_flatten(lbProcedure *p, lbValue m, Type *type) {
  585. if (is_type_array(m.type)) {
  586. // no-op
  587. m.type = type;
  588. return m;
  589. }
  590. Type *mt = base_type(m.type);
  591. GB_ASSERT(mt->kind == Type_Matrix);
  592. lbAddr res = lb_add_local_generated(p, type, true);
  593. GB_ASSERT(type_size_of(type) == type_size_of(m.type));
  594. lbValue m_ptr = lb_address_from_load_or_generate_local(p, m);
  595. lbValue n = lb_const_int(p->module, t_int, type_size_of(type));
  596. lb_mem_copy_non_overlapping(p, res.addr, m_ptr, n);
  597. // i64 row_count = mt->Matrix.row_count;
  598. // i64 column_count = mt->Matrix.column_count;
  599. // TEMPORARY_ALLOCATOR_GUARD();
  600. // auto srcs = array_make<lbValue>(temporary_allocator(), 0, row_count*column_count);
  601. // auto dsts = array_make<lbValue>(temporary_allocator(), 0, row_count*column_count);
  602. // for (i64 j = 0; j < column_count; j++) {
  603. // for (i64 i = 0; i < row_count; i++) {
  604. // lbValue src = lb_emit_matrix_ev(p, m, i, j);
  605. // array_add(&srcs, src);
  606. // }
  607. // }
  608. // for (i64 j = 0; j < column_count; j++) {
  609. // for (i64 i = 0; i < row_count; i++) {
  610. // lbValue dst = lb_emit_array_epi(p, res.addr, i + j*row_count);
  611. // array_add(&dsts, dst);
  612. // }
  613. // }
  614. // GB_ASSERT(srcs.count == dsts.count);
  615. // for_array(i, srcs) {
  616. // lb_emit_store(p, dsts[i], srcs[i]);
  617. // }
  618. return lb_addr_load(p, res);
  619. }
  620. gb_internal lbValue lb_emit_outer_product(lbProcedure *p, lbValue a, lbValue b, Type *type) {
  621. Type *mt = base_type(type);
  622. Type *at = base_type(a.type);
  623. Type *bt = base_type(b.type);
  624. GB_ASSERT(mt->kind == Type_Matrix);
  625. GB_ASSERT(at->kind == Type_Array);
  626. GB_ASSERT(bt->kind == Type_Array);
  627. i64 row_count = mt->Matrix.row_count;
  628. i64 column_count = mt->Matrix.column_count;
  629. GB_ASSERT(row_count == at->Array.count);
  630. GB_ASSERT(column_count == bt->Array.count);
  631. lbAddr res = lb_add_local_generated(p, type, true);
  632. for (i64 j = 0; j < column_count; j++) {
  633. for (i64 i = 0; i < row_count; i++) {
  634. lbValue x = lb_emit_struct_ev(p, a, cast(i32)i);
  635. lbValue y = lb_emit_struct_ev(p, b, cast(i32)j);
  636. lbValue src = lb_emit_arith(p, Token_Mul, x, y, mt->Matrix.elem);
  637. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  638. lb_emit_store(p, dst, src);
  639. }
  640. }
  641. return lb_addr_load(p, res);
  642. }
  643. gb_internal lbValue lb_emit_matrix_mul(lbProcedure *p, lbValue lhs, lbValue rhs, Type *type) {
  644. // TODO(bill): Handle edge case for f16 types on x86(-64) platforms
  645. Type *xt = base_type(lhs.type);
  646. Type *yt = base_type(rhs.type);
  647. GB_ASSERT(is_type_matrix(type));
  648. GB_ASSERT(is_type_matrix(xt));
  649. GB_ASSERT(is_type_matrix(yt));
  650. GB_ASSERT(xt->Matrix.column_count == yt->Matrix.row_count);
  651. GB_ASSERT(are_types_identical(xt->Matrix.elem, yt->Matrix.elem));
  652. GB_ASSERT(xt->Matrix.is_row_major == yt->Matrix.is_row_major);
  653. Type *elem = xt->Matrix.elem;
  654. unsigned outer_rows = cast(unsigned)xt->Matrix.row_count;
  655. unsigned inner = cast(unsigned)xt->Matrix.column_count;
  656. unsigned outer_columns = cast(unsigned)yt->Matrix.column_count;
  657. if (!xt->Matrix.is_row_major && lb_is_matrix_simdable(xt)) {
  658. unsigned x_stride = cast(unsigned)matrix_type_stride_in_elems(xt);
  659. unsigned y_stride = cast(unsigned)matrix_type_stride_in_elems(yt);
  660. auto x_rows = slice_make<LLVMValueRef>(permanent_allocator(), outer_rows);
  661. auto y_columns = slice_make<LLVMValueRef>(permanent_allocator(), outer_columns);
  662. LLVMValueRef x_vector = lb_matrix_to_vector(p, lhs);
  663. LLVMValueRef y_vector = lb_matrix_to_vector(p, rhs);
  664. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), inner);
  665. for (unsigned i = 0; i < outer_rows; i++) {
  666. for (unsigned j = 0; j < inner; j++) {
  667. unsigned offset = x_stride*j + i;
  668. mask_elems[j] = lb_const_int(p->module, t_u32, offset).value;
  669. }
  670. // transpose mask
  671. LLVMValueRef mask = LLVMConstVector(mask_elems.data, inner);
  672. LLVMValueRef row = llvm_basic_shuffle(p, x_vector, mask);
  673. x_rows[i] = row;
  674. }
  675. for (unsigned i = 0; i < outer_columns; i++) {
  676. LLVMValueRef mask = llvm_mask_iota(p->module, y_stride*i, inner);
  677. LLVMValueRef column = llvm_basic_shuffle(p, y_vector, mask);
  678. y_columns[i] = column;
  679. }
  680. lbAddr res = lb_add_local_generated(p, type, true);
  681. for_array(i, x_rows) {
  682. LLVMValueRef x_row = x_rows[i];
  683. for_array(j, y_columns) {
  684. LLVMValueRef y_column = y_columns[j];
  685. LLVMValueRef elem = llvm_vector_dot(p, x_row, y_column);
  686. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  687. LLVMBuildStore(p->builder, elem, dst.value);
  688. }
  689. }
  690. return lb_addr_load(p, res);
  691. }
  692. if (!xt->Matrix.is_row_major) {
  693. lbAddr res = lb_add_local_generated(p, type, true);
  694. auto inners = slice_make<lbValue[2]>(permanent_allocator(), inner);
  695. for (unsigned j = 0; j < outer_columns; j++) {
  696. for (unsigned i = 0; i < outer_rows; i++) {
  697. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  698. for (unsigned k = 0; k < inner; k++) {
  699. inners[k][0] = lb_emit_matrix_ev(p, lhs, i, k);
  700. inners[k][1] = lb_emit_matrix_ev(p, rhs, k, j);
  701. }
  702. lbValue sum = lb_const_nil(p->module, elem);
  703. for (unsigned k = 0; k < inner; k++) {
  704. lbValue a = inners[k][0];
  705. lbValue b = inners[k][1];
  706. sum = lb_emit_mul_add(p, a, b, sum, elem);
  707. }
  708. lb_emit_store(p, dst, sum);
  709. }
  710. }
  711. return lb_addr_load(p, res);
  712. } else {
  713. lbAddr res = lb_add_local_generated(p, type, true);
  714. auto inners = slice_make<lbValue[2]>(permanent_allocator(), inner);
  715. for (unsigned i = 0; i < outer_rows; i++) {
  716. for (unsigned j = 0; j < outer_columns; j++) {
  717. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  718. for (unsigned k = 0; k < inner; k++) {
  719. inners[k][0] = lb_emit_matrix_ev(p, lhs, i, k);
  720. inners[k][1] = lb_emit_matrix_ev(p, rhs, k, j);
  721. }
  722. lbValue sum = lb_const_nil(p->module, elem);
  723. for (unsigned k = 0; k < inner; k++) {
  724. lbValue a = inners[k][0];
  725. lbValue b = inners[k][1];
  726. sum = lb_emit_mul_add(p, a, b, sum, elem);
  727. }
  728. lb_emit_store(p, dst, sum);
  729. }
  730. }
  731. return lb_addr_load(p, res);
  732. }
  733. }
  734. gb_internal lbValue lb_emit_matrix_mul_vector(lbProcedure *p, lbValue lhs, lbValue rhs, Type *type) {
  735. // TODO(bill): Handle edge case for f16 types on x86(-64) platforms
  736. Type *mt = base_type(lhs.type);
  737. Type *vt = base_type(rhs.type);
  738. GB_ASSERT(is_type_matrix(mt));
  739. GB_ASSERT(is_type_array_like(vt));
  740. i64 vector_count = get_array_type_count(vt);
  741. GB_ASSERT(mt->Matrix.column_count == vector_count);
  742. GB_ASSERT(are_types_identical(mt->Matrix.elem, base_array_type(vt)));
  743. Type *elem = mt->Matrix.elem;
  744. if (!mt->Matrix.is_row_major && lb_is_matrix_simdable(mt)) {
  745. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  746. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  747. unsigned column_count = cast(unsigned)mt->Matrix.column_count;
  748. auto m_columns = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  749. auto v_rows = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  750. LLVMValueRef matrix_vector = lb_matrix_to_vector(p, lhs);
  751. for (unsigned column_index = 0; column_index < column_count; column_index++) {
  752. LLVMValueRef mask = llvm_mask_iota(p->module, stride*column_index, row_count);
  753. LLVMValueRef column = llvm_basic_shuffle(p, matrix_vector, mask);
  754. m_columns[column_index] = column;
  755. }
  756. for (unsigned row_index = 0; row_index < column_count; row_index++) {
  757. LLVMValueRef value = lb_emit_struct_ev(p, rhs, row_index).value;
  758. LLVMValueRef row = llvm_vector_broadcast(p, value, row_count);
  759. v_rows[row_index] = row;
  760. }
  761. GB_ASSERT(column_count > 0);
  762. LLVMValueRef vector = nullptr;
  763. for (i64 i = 0; i < column_count; i++) {
  764. if (i == 0) {
  765. vector = llvm_vector_mul(p, m_columns[i], v_rows[i]);
  766. } else {
  767. vector = llvm_vector_mul_add(p, m_columns[i], v_rows[i], vector);
  768. }
  769. }
  770. return lb_matrix_cast_vector_to_type(p, vector, type);
  771. }
  772. lbAddr res = lb_add_local_generated(p, type, true);
  773. for (i64 i = 0; i < mt->Matrix.row_count; i++) {
  774. for (i64 j = 0; j < mt->Matrix.column_count; j++) {
  775. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, 0);
  776. lbValue d0 = lb_emit_load(p, dst);
  777. lbValue a = lb_emit_matrix_ev(p, lhs, i, j);
  778. lbValue b = lb_emit_struct_ev(p, rhs, cast(i32)j);
  779. lbValue c = lb_emit_mul_add(p, a, b, d0, elem);
  780. lb_emit_store(p, dst, c);
  781. }
  782. }
  783. return lb_addr_load(p, res);
  784. }
  785. gb_internal lbValue lb_emit_vector_mul_matrix(lbProcedure *p, lbValue lhs, lbValue rhs, Type *type) {
  786. // TODO(bill): Handle edge case for f16 types on x86(-64) platforms
  787. Type *mt = base_type(rhs.type);
  788. Type *vt = base_type(lhs.type);
  789. GB_ASSERT(is_type_matrix(mt));
  790. GB_ASSERT(is_type_array_like(vt));
  791. i64 vector_count = get_array_type_count(vt);
  792. GB_ASSERT(vector_count == mt->Matrix.row_count);
  793. GB_ASSERT(are_types_identical(mt->Matrix.elem, base_array_type(vt)));
  794. Type *elem = mt->Matrix.elem;
  795. if (!mt->Matrix.is_row_major && lb_is_matrix_simdable(mt)) {
  796. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  797. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  798. unsigned column_count = cast(unsigned)mt->Matrix.column_count; gb_unused(column_count);
  799. auto m_columns = slice_make<LLVMValueRef>(permanent_allocator(), row_count);
  800. auto v_rows = slice_make<LLVMValueRef>(permanent_allocator(), row_count);
  801. LLVMValueRef matrix_vector = lb_matrix_to_vector(p, rhs);
  802. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  803. for (unsigned row_index = 0; row_index < row_count; row_index++) {
  804. for (unsigned column_index = 0; column_index < column_count; column_index++) {
  805. unsigned offset = row_index + column_index*stride;
  806. mask_elems[column_index] = lb_const_int(p->module, t_u32, offset).value;
  807. }
  808. // transpose mask
  809. LLVMValueRef mask = LLVMConstVector(mask_elems.data, column_count);
  810. LLVMValueRef column = llvm_basic_shuffle(p, matrix_vector, mask);
  811. m_columns[row_index] = column;
  812. }
  813. for (unsigned column_index = 0; column_index < row_count; column_index++) {
  814. LLVMValueRef value = lb_emit_struct_ev(p, lhs, column_index).value;
  815. LLVMValueRef row = llvm_vector_broadcast(p, value, column_count);
  816. v_rows[column_index] = row;
  817. }
  818. GB_ASSERT(row_count > 0);
  819. LLVMValueRef vector = nullptr;
  820. for (i64 i = 0; i < row_count; i++) {
  821. if (i == 0) {
  822. vector = llvm_vector_mul(p, v_rows[i], m_columns[i]);
  823. } else {
  824. vector = llvm_vector_mul_add(p, v_rows[i], m_columns[i], vector);
  825. }
  826. }
  827. lbAddr res = lb_add_local_generated(p, type, true);
  828. LLVMValueRef res_ptr = res.addr.value;
  829. unsigned alignment = cast(unsigned)gb_max(type_align_of(type), lb_alignof(LLVMTypeOf(vector)));
  830. LLVMSetAlignment(res_ptr, alignment);
  831. res_ptr = LLVMBuildPointerCast(p->builder, res_ptr, LLVMPointerType(LLVMTypeOf(vector), 0), "");
  832. LLVMBuildStore(p->builder, vector, res_ptr);
  833. return lb_addr_load(p, res);
  834. }
  835. lbAddr res = lb_add_local_generated(p, type, true);
  836. for (i64 j = 0; j < mt->Matrix.column_count; j++) {
  837. for (i64 k = 0; k < mt->Matrix.row_count; k++) {
  838. lbValue dst = lb_emit_matrix_epi(p, res.addr, 0, j);
  839. lbValue d0 = lb_emit_load(p, dst);
  840. lbValue a = lb_emit_struct_ev(p, lhs, cast(i32)k);
  841. lbValue b = lb_emit_matrix_ev(p, rhs, k, j);
  842. lbValue c = lb_emit_mul_add(p, a, b, d0, elem);
  843. lb_emit_store(p, dst, c);
  844. }
  845. }
  846. return lb_addr_load(p, res);
  847. }
  848. gb_internal lbValue lb_emit_arith_matrix(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type, bool component_wise) {
  849. GB_ASSERT(is_type_matrix(lhs.type) || is_type_matrix(rhs.type));
  850. if (op == Token_Mul && !component_wise) {
  851. Type *xt = base_type(lhs.type);
  852. Type *yt = base_type(rhs.type);
  853. if (xt->kind == Type_Matrix) {
  854. if (yt->kind == Type_Matrix) {
  855. return lb_emit_matrix_mul(p, lhs, rhs, type);
  856. } else if (is_type_array_like(yt)) {
  857. return lb_emit_matrix_mul_vector(p, lhs, rhs, type);
  858. }
  859. } else if (is_type_array_like(xt)) {
  860. GB_ASSERT(yt->kind == Type_Matrix);
  861. return lb_emit_vector_mul_matrix(p, lhs, rhs, type);
  862. } else {
  863. GB_ASSERT(xt->kind == Type_Basic);
  864. GB_ASSERT(yt->kind == Type_Matrix);
  865. GB_ASSERT(is_type_matrix(type));
  866. Type *array_type = alloc_type_array(yt->Matrix.elem, matrix_type_total_internal_elems(yt));
  867. GB_ASSERT(type_size_of(array_type) == type_size_of(yt));
  868. lbValue array_lhs = lb_emit_conv(p, lhs, array_type);
  869. lbValue array_rhs = rhs;
  870. array_rhs.type = array_type;
  871. lbValue array = lb_emit_arith(p, op, array_lhs, array_rhs, array_type);
  872. array.type = type;
  873. return array;
  874. }
  875. } else {
  876. if (is_type_matrix(lhs.type)) {
  877. rhs = lb_emit_conv(p, rhs, lhs.type);
  878. } else {
  879. lhs = lb_emit_conv(p, lhs, rhs.type);
  880. }
  881. Type *xt = base_type(lhs.type);
  882. Type *yt = base_type(rhs.type);
  883. GB_ASSERT_MSG(are_types_identical(xt, yt), "%s %.*s %s", type_to_string(lhs.type), LIT(token_strings[op]), type_to_string(rhs.type));
  884. GB_ASSERT(xt->kind == Type_Matrix);
  885. // element-wise arithmetic
  886. // pretend it is an array
  887. lbValue array_lhs = lhs;
  888. lbValue array_rhs = rhs;
  889. Type *array_type = alloc_type_array(xt->Matrix.elem, matrix_type_total_internal_elems(xt));
  890. GB_ASSERT(type_size_of(array_type) == type_size_of(xt));
  891. array_lhs.type = array_type;
  892. array_rhs.type = array_type;
  893. if (token_is_comparison(op)) {
  894. lbValue res = lb_emit_comp(p, op, array_lhs, array_rhs);
  895. return lb_emit_conv(p, res, type);
  896. } else {
  897. lbValue array = lb_emit_arith(p, op, array_lhs, array_rhs, array_type);
  898. array.type = type;
  899. return array;
  900. }
  901. }
  902. GB_PANIC("TODO: lb_emit_arith_matrix");
  903. return {};
  904. }
  905. gb_internal lbValue lb_emit_arith(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type) {
  906. if (is_type_array_like(lhs.type) || is_type_array_like(rhs.type)) {
  907. return lb_emit_arith_array(p, op, lhs, rhs, type);
  908. } else if (is_type_matrix(lhs.type) || is_type_matrix(rhs.type)) {
  909. return lb_emit_arith_matrix(p, op, lhs, rhs, type, false);
  910. } else if (is_type_complex(type)) {
  911. lhs = lb_emit_conv(p, lhs, type);
  912. rhs = lb_emit_conv(p, rhs, type);
  913. Type *ft = base_complex_elem_type(type);
  914. if (op == Token_Quo) {
  915. TEMPORARY_ALLOCATOR_GUARD();
  916. auto args = array_make<lbValue>(temporary_allocator(), 2);
  917. args[0] = lhs;
  918. args[1] = rhs;
  919. switch (type_size_of(ft)) {
  920. case 2: return lb_emit_runtime_call(p, "quo_complex32", args);
  921. case 4: return lb_emit_runtime_call(p, "quo_complex64", args);
  922. case 8: return lb_emit_runtime_call(p, "quo_complex128", args);
  923. default: GB_PANIC("Unknown float type"); break;
  924. }
  925. }
  926. lbAddr res = lb_add_local_generated(p, type, false); // NOTE: initialized in full later
  927. lbValue a = lb_emit_struct_ev(p, lhs, 0);
  928. lbValue b = lb_emit_struct_ev(p, lhs, 1);
  929. lbValue c = lb_emit_struct_ev(p, rhs, 0);
  930. lbValue d = lb_emit_struct_ev(p, rhs, 1);
  931. lbValue real = {};
  932. lbValue imag = {};
  933. switch (op) {
  934. case Token_Add:
  935. case Token_Sub:
  936. if (type_size_of(ft) == 2) {
  937. a = lb_emit_conv(p, a, t_f32);
  938. b = lb_emit_conv(p, b, t_f32);
  939. c = lb_emit_conv(p, c, t_f32);
  940. d = lb_emit_conv(p, d, t_f32);
  941. real = lb_emit_arith(p, op, a, c, t_f32);
  942. imag = lb_emit_arith(p, op, b, d, t_f32);
  943. real = lb_emit_conv(p, real, ft);
  944. imag = lb_emit_conv(p, imag, ft);
  945. } else {
  946. real = lb_emit_arith(p, op, a, c, ft);
  947. imag = lb_emit_arith(p, op, b, d, ft);
  948. }
  949. break;
  950. case Token_Mul: {
  951. lbValue x = lb_emit_arith(p, Token_Mul, a, c, ft);
  952. lbValue y = lb_emit_arith(p, Token_Mul, b, d, ft);
  953. real = lb_emit_arith(p, Token_Sub, x, y, ft);
  954. lbValue z = lb_emit_arith(p, Token_Mul, b, c, ft);
  955. lbValue w = lb_emit_arith(p, Token_Mul, a, d, ft);
  956. imag = lb_emit_arith(p, Token_Add, z, w, ft);
  957. break;
  958. }
  959. }
  960. lb_emit_store(p, lb_emit_struct_ep(p, res.addr, 0), real);
  961. lb_emit_store(p, lb_emit_struct_ep(p, res.addr, 1), imag);
  962. return lb_addr_load(p, res);
  963. } else if (is_type_quaternion(type)) {
  964. lhs = lb_emit_conv(p, lhs, type);
  965. rhs = lb_emit_conv(p, rhs, type);
  966. Type *ft = base_complex_elem_type(type);
  967. if (op == Token_Add || op == Token_Sub) {
  968. Type *immediate_type = ft;
  969. if (type_size_of(ft) == 2) {
  970. immediate_type = t_f32;
  971. }
  972. lbAddr res = lb_add_local_generated(p, type, false); // NOTE: initialized in full later
  973. lbValue x0 = lb_emit_struct_ev(p, lhs, 0);
  974. lbValue x1 = lb_emit_struct_ev(p, lhs, 1);
  975. lbValue x2 = lb_emit_struct_ev(p, lhs, 2);
  976. lbValue x3 = lb_emit_struct_ev(p, lhs, 3);
  977. lbValue y0 = lb_emit_struct_ev(p, rhs, 0);
  978. lbValue y1 = lb_emit_struct_ev(p, rhs, 1);
  979. lbValue y2 = lb_emit_struct_ev(p, rhs, 2);
  980. lbValue y3 = lb_emit_struct_ev(p, rhs, 3);
  981. if (immediate_type != ft) {
  982. x0 = lb_emit_conv(p, x0, immediate_type);
  983. x1 = lb_emit_conv(p, x1, immediate_type);
  984. x2 = lb_emit_conv(p, x2, immediate_type);
  985. x3 = lb_emit_conv(p, x3, immediate_type);
  986. y0 = lb_emit_conv(p, y0, immediate_type);
  987. y1 = lb_emit_conv(p, y1, immediate_type);
  988. y2 = lb_emit_conv(p, y2, immediate_type);
  989. y3 = lb_emit_conv(p, y3, immediate_type);
  990. }
  991. lbValue z0 = lb_emit_arith(p, op, x0, y0, immediate_type);
  992. lbValue z1 = lb_emit_arith(p, op, x1, y1, immediate_type);
  993. lbValue z2 = lb_emit_arith(p, op, x2, y2, immediate_type);
  994. lbValue z3 = lb_emit_arith(p, op, x3, y3, immediate_type);
  995. lbValue d0 = lb_emit_struct_ep(p, res.addr, 0);
  996. lbValue d1 = lb_emit_struct_ep(p, res.addr, 1);
  997. lbValue d2 = lb_emit_struct_ep(p, res.addr, 2);
  998. lbValue d3 = lb_emit_struct_ep(p, res.addr, 3);
  999. if (immediate_type != ft) {
  1000. z0 = lb_emit_conv(p, z0, ft);
  1001. z1 = lb_emit_conv(p, z1, ft);
  1002. z2 = lb_emit_conv(p, z2, ft);
  1003. z3 = lb_emit_conv(p, z3, ft);
  1004. }
  1005. lb_emit_store(p, d0, z0);
  1006. lb_emit_store(p, d1, z1);
  1007. lb_emit_store(p, d2, z2);
  1008. lb_emit_store(p, d3, z3);
  1009. return lb_addr_load(p, res);
  1010. } else if (op == Token_Mul) {
  1011. TEMPORARY_ALLOCATOR_GUARD();
  1012. auto args = array_make<lbValue>(temporary_allocator(), 2);
  1013. args[0] = lhs;
  1014. args[1] = rhs;
  1015. switch (8*type_size_of(ft)) {
  1016. case 16: return lb_emit_runtime_call(p, "mul_quaternion64", args);
  1017. case 32: return lb_emit_runtime_call(p, "mul_quaternion128", args);
  1018. case 64: return lb_emit_runtime_call(p, "mul_quaternion256", args);
  1019. default: GB_PANIC("Unknown float type"); break;
  1020. }
  1021. } else if (op == Token_Quo) {
  1022. TEMPORARY_ALLOCATOR_GUARD();
  1023. auto args = array_make<lbValue>(temporary_allocator(), 2);
  1024. args[0] = lhs;
  1025. args[1] = rhs;
  1026. switch (8*type_size_of(ft)) {
  1027. case 16: return lb_emit_runtime_call(p, "quo_quaternion64", args);
  1028. case 32: return lb_emit_runtime_call(p, "quo_quaternion128", args);
  1029. case 64: return lb_emit_runtime_call(p, "quo_quaternion256", args);
  1030. default: GB_PANIC("Unknown float type"); break;
  1031. }
  1032. }
  1033. }
  1034. lhs = lb_emit_conv(p, lhs, type);
  1035. rhs = lb_emit_conv(p, rhs, type);
  1036. if (is_type_integer(type) && is_type_different_to_arch_endianness(type)) {
  1037. switch (op) {
  1038. case Token_AndNot:
  1039. case Token_And:
  1040. case Token_Or:
  1041. case Token_Xor:
  1042. goto handle_op;
  1043. }
  1044. Type *platform_type = integer_endian_type_to_platform_type(type);
  1045. lbValue x = lb_emit_byte_swap(p, lhs, integer_endian_type_to_platform_type(lhs.type));
  1046. lbValue y = lb_emit_byte_swap(p, rhs, integer_endian_type_to_platform_type(rhs.type));
  1047. lbValue res = lb_emit_arith(p, op, x, y, platform_type);
  1048. return lb_emit_byte_swap(p, res, type);
  1049. }
  1050. if (is_type_float(type) && is_type_different_to_arch_endianness(type)) {
  1051. Type *platform_type = integer_endian_type_to_platform_type(type);
  1052. lbValue x = lb_emit_conv(p, lhs, integer_endian_type_to_platform_type(lhs.type));
  1053. lbValue y = lb_emit_conv(p, rhs, integer_endian_type_to_platform_type(rhs.type));
  1054. lbValue res = lb_emit_arith(p, op, x, y, platform_type);
  1055. return lb_emit_byte_swap(p, res, type);
  1056. }
  1057. handle_op:;
  1058. lbValue res = {};
  1059. res.type = type;
  1060. // NOTE(bill): Bit Set Aliases for + and -
  1061. if (is_type_bit_set(type)) {
  1062. switch (op) {
  1063. case Token_Add: op = Token_Or; break;
  1064. case Token_Sub: op = Token_AndNot; break;
  1065. }
  1066. Type *u = bit_set_to_int(type);
  1067. if (is_type_array(u)) {
  1068. lhs.type = u;
  1069. rhs.type = u;
  1070. res = lb_emit_arith(p, op, lhs, rhs, u);
  1071. res.type = type;
  1072. return res;
  1073. }
  1074. }
  1075. Type *integral_type = type;
  1076. if (is_type_simd_vector(integral_type)) {
  1077. integral_type = core_array_type(integral_type);
  1078. }
  1079. switch (op) {
  1080. case Token_Add:
  1081. if (is_type_float(integral_type)) {
  1082. res.value = LLVMBuildFAdd(p->builder, lhs.value, rhs.value, "");
  1083. return res;
  1084. }
  1085. res.value = LLVMBuildAdd(p->builder, lhs.value, rhs.value, "");
  1086. return res;
  1087. case Token_Sub:
  1088. if (is_type_float(integral_type)) {
  1089. res.value = LLVMBuildFSub(p->builder, lhs.value, rhs.value, "");
  1090. return res;
  1091. }
  1092. res.value = LLVMBuildSub(p->builder, lhs.value, rhs.value, "");
  1093. return res;
  1094. case Token_Mul:
  1095. if (is_type_float(integral_type)) {
  1096. res.value = LLVMBuildFMul(p->builder, lhs.value, rhs.value, "");
  1097. return res;
  1098. }
  1099. res.value = LLVMBuildMul(p->builder, lhs.value, rhs.value, "");
  1100. return res;
  1101. case Token_Quo:
  1102. if (is_type_float(integral_type)) {
  1103. res.value = LLVMBuildFDiv(p->builder, lhs.value, rhs.value, "");
  1104. return res;
  1105. } else if (is_type_unsigned(integral_type)) {
  1106. res.value = LLVMBuildUDiv(p->builder, lhs.value, rhs.value, "");
  1107. return res;
  1108. }
  1109. res.value = LLVMBuildSDiv(p->builder, lhs.value, rhs.value, "");
  1110. return res;
  1111. case Token_Mod:
  1112. if (is_type_float(integral_type)) {
  1113. res.value = LLVMBuildFRem(p->builder, lhs.value, rhs.value, "");
  1114. return res;
  1115. } else if (is_type_unsigned(integral_type)) {
  1116. res.value = LLVMBuildURem(p->builder, lhs.value, rhs.value, "");
  1117. return res;
  1118. }
  1119. res.value = LLVMBuildSRem(p->builder, lhs.value, rhs.value, "");
  1120. return res;
  1121. case Token_ModMod:
  1122. if (is_type_unsigned(integral_type)) {
  1123. res.value = LLVMBuildURem(p->builder, lhs.value, rhs.value, "");
  1124. return res;
  1125. } else {
  1126. LLVMValueRef a = LLVMBuildSRem(p->builder, lhs.value, rhs.value, "");
  1127. LLVMValueRef b = LLVMBuildAdd(p->builder, a, rhs.value, "");
  1128. LLVMValueRef c = LLVMBuildSRem(p->builder, b, rhs.value, "");
  1129. res.value = c;
  1130. return res;
  1131. }
  1132. case Token_And:
  1133. res.value = LLVMBuildAnd(p->builder, lhs.value, rhs.value, "");
  1134. return res;
  1135. case Token_Or:
  1136. res.value = LLVMBuildOr(p->builder, lhs.value, rhs.value, "");
  1137. return res;
  1138. case Token_Xor:
  1139. res.value = LLVMBuildXor(p->builder, lhs.value, rhs.value, "");
  1140. return res;
  1141. case Token_Shl:
  1142. {
  1143. rhs = lb_emit_conv(p, rhs, lhs.type);
  1144. LLVMValueRef lhsval = lhs.value;
  1145. LLVMValueRef bits = rhs.value;
  1146. LLVMValueRef bit_size = LLVMConstInt(lb_type(p->module, rhs.type), 8*type_size_of(lhs.type), false);
  1147. LLVMValueRef width_test = LLVMBuildICmp(p->builder, LLVMIntULT, bits, bit_size, "");
  1148. res.value = LLVMBuildShl(p->builder, lhsval, bits, "");
  1149. LLVMValueRef zero = LLVMConstNull(lb_type(p->module, lhs.type));
  1150. res.value = LLVMBuildSelect(p->builder, width_test, res.value, zero, "");
  1151. return res;
  1152. }
  1153. case Token_Shr:
  1154. {
  1155. rhs = lb_emit_conv(p, rhs, lhs.type);
  1156. LLVMValueRef lhsval = lhs.value;
  1157. LLVMValueRef bits = rhs.value;
  1158. bool is_unsigned = is_type_unsigned(integral_type);
  1159. LLVMValueRef bit_size = LLVMConstInt(lb_type(p->module, rhs.type), 8*type_size_of(lhs.type), false);
  1160. LLVMValueRef width_test = LLVMBuildICmp(p->builder, LLVMIntULT, bits, bit_size, "");
  1161. if (is_unsigned) {
  1162. res.value = LLVMBuildLShr(p->builder, lhsval, bits, "");
  1163. } else {
  1164. res.value = LLVMBuildAShr(p->builder, lhsval, bits, "");
  1165. }
  1166. LLVMValueRef zero = LLVMConstNull(lb_type(p->module, lhs.type));
  1167. res.value = LLVMBuildSelect(p->builder, width_test, res.value, zero, "");
  1168. return res;
  1169. }
  1170. case Token_AndNot:
  1171. {
  1172. LLVMValueRef new_rhs = LLVMBuildNot(p->builder, rhs.value, "");
  1173. res.value = LLVMBuildAnd(p->builder, lhs.value, new_rhs, "");
  1174. return res;
  1175. }
  1176. break;
  1177. }
  1178. GB_PANIC("unhandled operator of lb_emit_arith");
  1179. return {};
  1180. }
  1181. gb_internal bool lb_is_empty_string_constant(Ast *expr) {
  1182. if (expr->tav.value.kind == ExactValue_String &&
  1183. is_type_string(expr->tav.type)) {
  1184. String s = expr->tav.value.value_string;
  1185. return s.len == 0;
  1186. }
  1187. return false;
  1188. }
  1189. gb_internal lbValue lb_build_binary_in(lbProcedure *p, lbValue left, lbValue right, TokenKind op) {
  1190. Type *rt = base_type(right.type);
  1191. if (is_type_pointer(rt)) {
  1192. right = lb_emit_load(p, right);
  1193. rt = base_type(type_deref(rt));
  1194. }
  1195. switch (rt->kind) {
  1196. case Type_Map:
  1197. {
  1198. lbValue map_ptr = lb_address_from_load_or_generate_local(p, right);
  1199. lbValue key = left;
  1200. lbValue ptr = lb_internal_dynamic_map_get_ptr(p, map_ptr, key);
  1201. if (op == Token_in) {
  1202. return lb_emit_conv(p, lb_emit_comp_against_nil(p, Token_NotEq, ptr), t_bool);
  1203. } else {
  1204. return lb_emit_conv(p, lb_emit_comp_against_nil(p, Token_CmpEq, ptr), t_bool);
  1205. }
  1206. }
  1207. break;
  1208. case Type_BitSet:
  1209. {
  1210. Type *key_type = rt->BitSet.elem;
  1211. GB_ASSERT(are_types_identical(left.type, key_type));
  1212. Type *it = bit_set_to_int(rt);
  1213. left = lb_emit_conv(p, left, it);
  1214. if (is_type_different_to_arch_endianness(it)) {
  1215. left = lb_emit_byte_swap(p, left, integer_endian_type_to_platform_type(it));
  1216. }
  1217. lbValue lower = lb_const_value(p->module, left.type, exact_value_i64(rt->BitSet.lower));
  1218. lbValue key = lb_emit_arith(p, Token_Sub, left, lower, left.type);
  1219. lbValue bit = lb_emit_arith(p, Token_Shl, lb_const_int(p->module, left.type, 1), key, left.type);
  1220. bit = lb_emit_conv(p, bit, it);
  1221. lbValue old_value = lb_emit_transmute(p, right, it);
  1222. lbValue new_value = lb_emit_arith(p, Token_And, old_value, bit, it);
  1223. if (op == Token_in) {
  1224. return lb_emit_conv(p, lb_emit_comp(p, Token_NotEq, new_value, lb_const_int(p->module, new_value.type, 0)), t_bool);
  1225. } else {
  1226. return lb_emit_conv(p, lb_emit_comp(p, Token_CmpEq, new_value, lb_const_int(p->module, new_value.type, 0)), t_bool);
  1227. }
  1228. }
  1229. break;
  1230. }
  1231. GB_PANIC("Invalid 'in' type");
  1232. return {};
  1233. }
  1234. gb_internal lbValue lb_build_binary_expr(lbProcedure *p, Ast *expr) {
  1235. ast_node(be, BinaryExpr, expr);
  1236. TypeAndValue tv = type_and_value_of_expr(expr);
  1237. if (is_type_matrix(be->left->tav.type) || is_type_matrix(be->right->tav.type)) {
  1238. lbValue left = lb_build_expr(p, be->left);
  1239. lbValue right = lb_build_expr(p, be->right);
  1240. return lb_emit_arith_matrix(p, be->op.kind, left, right, default_type(tv.type), false);
  1241. }
  1242. switch (be->op.kind) {
  1243. case Token_Add:
  1244. case Token_Sub:
  1245. case Token_Mul:
  1246. case Token_Quo:
  1247. case Token_Mod:
  1248. case Token_ModMod:
  1249. case Token_And:
  1250. case Token_Or:
  1251. case Token_Xor:
  1252. case Token_AndNot: {
  1253. Type *type = default_type(tv.type);
  1254. lbValue left = lb_build_expr(p, be->left);
  1255. lbValue right = lb_build_expr(p, be->right);
  1256. return lb_emit_arith(p, be->op.kind, left, right, type);
  1257. }
  1258. case Token_Shl:
  1259. case Token_Shr: {
  1260. lbValue left, right;
  1261. Type *type = default_type(tv.type);
  1262. left = lb_build_expr(p, be->left);
  1263. if (lb_is_expr_untyped_const(be->right)) {
  1264. // NOTE(bill): RHS shift operands can still be untyped
  1265. // Just bypass the standard lb_build_expr
  1266. right = lb_expr_untyped_const_to_typed(p->module, be->right, type);
  1267. } else {
  1268. right = lb_build_expr(p, be->right);
  1269. }
  1270. return lb_emit_arith(p, be->op.kind, left, right, type);
  1271. }
  1272. case Token_CmpEq:
  1273. case Token_NotEq:
  1274. if (is_type_untyped_nil(be->right->tav.type)) {
  1275. // `x == nil` or `x != nil`
  1276. lbValue left = lb_build_expr(p, be->left);
  1277. lbValue cmp = lb_emit_comp_against_nil(p, be->op.kind, left);
  1278. Type *type = default_type(tv.type);
  1279. return lb_emit_conv(p, cmp, type);
  1280. } else if (is_type_untyped_nil(be->left->tav.type)) {
  1281. // `nil == x` or `nil != x`
  1282. lbValue right = lb_build_expr(p, be->right);
  1283. lbValue cmp = lb_emit_comp_against_nil(p, be->op.kind, right);
  1284. Type *type = default_type(tv.type);
  1285. return lb_emit_conv(p, cmp, type);
  1286. } else if (lb_is_empty_string_constant(be->right) && !is_type_union(be->left->tav.type)) {
  1287. // `x == ""` or `x != ""`
  1288. lbValue s = lb_build_expr(p, be->left);
  1289. s = lb_emit_conv(p, s, t_string);
  1290. lbValue len = lb_string_len(p, s);
  1291. lbValue cmp = lb_emit_comp(p, be->op.kind, len, lb_const_int(p->module, t_int, 0));
  1292. Type *type = default_type(tv.type);
  1293. return lb_emit_conv(p, cmp, type);
  1294. } else if (lb_is_empty_string_constant(be->left) && !is_type_union(be->right->tav.type)) {
  1295. // `"" == x` or `"" != x`
  1296. lbValue s = lb_build_expr(p, be->right);
  1297. s = lb_emit_conv(p, s, t_string);
  1298. lbValue len = lb_string_len(p, s);
  1299. lbValue cmp = lb_emit_comp(p, be->op.kind, len, lb_const_int(p->module, t_int, 0));
  1300. Type *type = default_type(tv.type);
  1301. return lb_emit_conv(p, cmp, type);
  1302. }
  1303. /*fallthrough*/
  1304. case Token_Lt:
  1305. case Token_LtEq:
  1306. case Token_Gt:
  1307. case Token_GtEq:
  1308. {
  1309. lbValue left = {};
  1310. lbValue right = {};
  1311. if (be->left->tav.mode == Addressing_Type) {
  1312. left = lb_typeid(p->module, be->left->tav.type);
  1313. }
  1314. if (be->right->tav.mode == Addressing_Type) {
  1315. right = lb_typeid(p->module, be->right->tav.type);
  1316. }
  1317. if (left.value == nullptr) left = lb_build_expr(p, be->left);
  1318. if (right.value == nullptr) right = lb_build_expr(p, be->right);
  1319. lbValue cmp = lb_emit_comp(p, be->op.kind, left, right);
  1320. Type *type = default_type(tv.type);
  1321. return lb_emit_conv(p, cmp, type);
  1322. }
  1323. case Token_CmpAnd:
  1324. case Token_CmpOr:
  1325. return lb_emit_logical_binary_expr(p, be->op.kind, be->left, be->right, tv.type);
  1326. case Token_in:
  1327. case Token_not_in:
  1328. {
  1329. lbValue left = lb_build_expr(p, be->left);
  1330. lbValue right = lb_build_expr(p, be->right);
  1331. return lb_build_binary_in(p, left, right, be->op.kind);
  1332. }
  1333. default:
  1334. GB_PANIC("Invalid binary expression");
  1335. break;
  1336. }
  1337. return {};
  1338. }
  1339. gb_internal lbValue lb_emit_conv(lbProcedure *p, lbValue value, Type *t) {
  1340. lbModule *m = p->module;
  1341. t = reduce_tuple_to_single_type(t);
  1342. Type *src_type = value.type;
  1343. if (are_types_identical(t, src_type)) {
  1344. return value;
  1345. }
  1346. Type *src = core_type(src_type);
  1347. Type *dst = core_type(t);
  1348. GB_ASSERT(src != nullptr);
  1349. GB_ASSERT(dst != nullptr);
  1350. if (is_type_untyped_uninit(src)) {
  1351. return lb_const_undef(m, t);
  1352. }
  1353. if (is_type_untyped_nil(src)) {
  1354. return lb_const_nil(m, t);
  1355. }
  1356. if (LLVMIsConstant(value.value)) {
  1357. if (is_type_any(dst)) {
  1358. Type *st = default_type(src_type);
  1359. lbAddr default_value = lb_add_local_generated(p, st, false);
  1360. lb_addr_store(p, default_value, value);
  1361. lbValue data = lb_emit_conv(p, default_value.addr, t_rawptr);
  1362. lbValue id = lb_typeid(m, st);
  1363. lbAddr res = lb_add_local_generated(p, t, false);
  1364. lbValue a0 = lb_emit_struct_ep(p, res.addr, 0);
  1365. lbValue a1 = lb_emit_struct_ep(p, res.addr, 1);
  1366. lb_emit_store(p, a0, data);
  1367. lb_emit_store(p, a1, id);
  1368. return lb_addr_load(p, res);
  1369. } else if (dst->kind == Type_Basic) {
  1370. if (src->kind == Type_Basic && src->Basic.kind == Basic_string && dst->Basic.kind == Basic_cstring) {
  1371. String str = lb_get_const_string(m, value);
  1372. lbValue res = {};
  1373. res.type = t;
  1374. res.value = llvm_cstring(m, str);
  1375. return res;
  1376. }
  1377. // if (is_type_float(dst)) {
  1378. // return value;
  1379. // } else if (is_type_integer(dst)) {
  1380. // return value;
  1381. // }
  1382. // ExactValue ev = value->Constant.value;
  1383. // if (is_type_float(dst)) {
  1384. // ev = exact_value_to_float(ev);
  1385. // } else if (is_type_complex(dst)) {
  1386. // ev = exact_value_to_complex(ev);
  1387. // } else if (is_type_quaternion(dst)) {
  1388. // ev = exact_value_to_quaternion(ev);
  1389. // } else if (is_type_string(dst)) {
  1390. // // Handled elsewhere
  1391. // GB_ASSERT_MSG(ev.kind == ExactValue_String, "%d", ev.kind);
  1392. // } else if (is_type_integer(dst)) {
  1393. // ev = exact_value_to_integer(ev);
  1394. // } else if (is_type_pointer(dst)) {
  1395. // // IMPORTANT NOTE(bill): LLVM doesn't support pointer constants expect 'null'
  1396. // lbValue i = lb_add_module_constant(p->module, t_uintptr, ev);
  1397. // return lb_emit(p, lb_instr_conv(p, irConv_inttoptr, i, t_uintptr, dst));
  1398. // }
  1399. // return lb_const_value(p->module, t, ev);
  1400. }
  1401. }
  1402. if (are_types_identical(src, dst)) {
  1403. if (!are_types_identical(src_type, t)) {
  1404. return lb_emit_transmute(p, value, t);
  1405. }
  1406. return value;
  1407. }
  1408. // bool <-> llvm bool
  1409. if (is_type_boolean(src) && dst == t_llvm_bool) {
  1410. lbValue res = {};
  1411. res.value = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(lb_type(m, src)), "");
  1412. res.type = t;
  1413. return res;
  1414. }
  1415. if (src == t_llvm_bool && is_type_boolean(dst)) {
  1416. lbValue res = {};
  1417. res.value = LLVMBuildZExt(p->builder, value.value, lb_type(m, dst), "");
  1418. res.type = t;
  1419. return res;
  1420. }
  1421. // integer -> integer
  1422. if (is_type_integer(src) && is_type_integer(dst)) {
  1423. GB_ASSERT(src->kind == Type_Basic &&
  1424. dst->kind == Type_Basic);
  1425. i64 sz = type_size_of(default_type(src));
  1426. i64 dz = type_size_of(default_type(dst));
  1427. if (sz == dz) {
  1428. if (dz > 1 && !types_have_same_internal_endian(src, dst)) {
  1429. return lb_emit_byte_swap(p, value, t);
  1430. }
  1431. lbValue res = {};
  1432. res.value = value.value;
  1433. res.type = t;
  1434. return res;
  1435. }
  1436. if (sz > 1 && is_type_different_to_arch_endianness(src)) {
  1437. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1438. value = lb_emit_byte_swap(p, value, platform_src_type);
  1439. }
  1440. LLVMOpcode op = LLVMTrunc;
  1441. if (dz < sz) {
  1442. op = LLVMTrunc;
  1443. } else if (dz == sz) {
  1444. // NOTE(bill): In LLVM, all integers are signed and rely upon 2's compliment
  1445. // NOTE(bill): Copy the value just for type correctness
  1446. op = LLVMBitCast;
  1447. } else if (dz > sz) {
  1448. op = is_type_unsigned(src) ? LLVMZExt : LLVMSExt; // zero extent
  1449. }
  1450. if (dz > 1 && is_type_different_to_arch_endianness(dst)) {
  1451. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1452. lbValue res = {};
  1453. res.value = LLVMBuildCast(p->builder, op, value.value, lb_type(m, platform_dst_type), "");
  1454. res.type = t;
  1455. return lb_emit_byte_swap(p, res, t);
  1456. } else {
  1457. lbValue res = {};
  1458. res.value = LLVMBuildCast(p->builder, op, value.value, lb_type(m, t), "");
  1459. res.type = t;
  1460. return res;
  1461. }
  1462. }
  1463. // boolean -> boolean/integer
  1464. if (is_type_boolean(src) && (is_type_boolean(dst) || is_type_integer(dst))) {
  1465. LLVMValueRef b = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(lb_type(m, value.type)), "");
  1466. lbValue res = {};
  1467. res.value = LLVMBuildIntCast2(p->builder, b, lb_type(m, t), false, "");
  1468. res.type = t;
  1469. return res;
  1470. }
  1471. if (is_type_cstring(src) && is_type_u8_ptr(dst)) {
  1472. return lb_emit_transmute(p, value, dst);
  1473. }
  1474. if (is_type_u8_ptr(src) && is_type_cstring(dst)) {
  1475. return lb_emit_transmute(p, value, dst);
  1476. }
  1477. if (is_type_cstring(src) && is_type_u8_multi_ptr(dst)) {
  1478. return lb_emit_transmute(p, value, dst);
  1479. }
  1480. if (is_type_u8_multi_ptr(src) && is_type_cstring(dst)) {
  1481. return lb_emit_transmute(p, value, dst);
  1482. }
  1483. if (is_type_cstring(src) && is_type_rawptr(dst)) {
  1484. return lb_emit_transmute(p, value, dst);
  1485. }
  1486. if (is_type_rawptr(src) && is_type_cstring(dst)) {
  1487. return lb_emit_transmute(p, value, dst);
  1488. }
  1489. if (are_types_identical(src, t_cstring) && are_types_identical(dst, t_string)) {
  1490. TEMPORARY_ALLOCATOR_GUARD();
  1491. lbValue c = lb_emit_conv(p, value, t_cstring);
  1492. auto args = array_make<lbValue>(temporary_allocator(), 1);
  1493. args[0] = c;
  1494. lbValue s = lb_emit_runtime_call(p, "cstring_to_string", args);
  1495. return lb_emit_conv(p, s, dst);
  1496. }
  1497. // integer -> boolean
  1498. if (is_type_integer(src) && is_type_boolean(dst)) {
  1499. lbValue res = {};
  1500. res.value = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(lb_type(m, value.type)), "");
  1501. res.type = t_llvm_bool;
  1502. return lb_emit_conv(p, res, t);
  1503. }
  1504. // float -> float
  1505. if (is_type_float(src) && is_type_float(dst)) {
  1506. i64 sz = type_size_of(src);
  1507. i64 dz = type_size_of(dst);
  1508. if (dz == sz) {
  1509. if (types_have_same_internal_endian(src, dst)) {
  1510. lbValue res = {};
  1511. res.type = t;
  1512. res.value = value.value;
  1513. return res;
  1514. } else {
  1515. return lb_emit_byte_swap(p, value, t);
  1516. }
  1517. }
  1518. if (is_type_different_to_arch_endianness(src) || is_type_different_to_arch_endianness(dst)) {
  1519. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1520. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1521. lbValue res = {};
  1522. res = lb_emit_conv(p, value, platform_src_type);
  1523. res = lb_emit_conv(p, res, platform_dst_type);
  1524. if (is_type_different_to_arch_endianness(dst)) {
  1525. res = lb_emit_byte_swap(p, res, t);
  1526. }
  1527. return lb_emit_conv(p, res, t);
  1528. }
  1529. lbValue res = {};
  1530. res.type = t;
  1531. if (dz >= sz) {
  1532. res.value = LLVMBuildFPExt(p->builder, value.value, lb_type(m, t), "");
  1533. } else {
  1534. res.value = LLVMBuildFPTrunc(p->builder, value.value, lb_type(m, t), "");
  1535. }
  1536. return res;
  1537. }
  1538. if (is_type_complex(src) && is_type_complex(dst)) {
  1539. Type *ft = base_complex_elem_type(dst);
  1540. lbAddr gen = lb_add_local_generated(p, t, false);
  1541. lbValue gp = lb_addr_get_ptr(p, gen);
  1542. lbValue real = lb_emit_conv(p, lb_emit_struct_ev(p, value, 0), ft);
  1543. lbValue imag = lb_emit_conv(p, lb_emit_struct_ev(p, value, 1), ft);
  1544. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), real);
  1545. lb_emit_store(p, lb_emit_struct_ep(p, gp, 1), imag);
  1546. return lb_addr_load(p, gen);
  1547. }
  1548. if (is_type_quaternion(src) && is_type_quaternion(dst)) {
  1549. // @QuaternionLayout
  1550. Type *ft = base_complex_elem_type(dst);
  1551. lbAddr gen = lb_add_local_generated(p, t, false);
  1552. lbValue gp = lb_addr_get_ptr(p, gen);
  1553. lbValue q0 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 0), ft);
  1554. lbValue q1 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 1), ft);
  1555. lbValue q2 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 2), ft);
  1556. lbValue q3 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 3), ft);
  1557. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), q0);
  1558. lb_emit_store(p, lb_emit_struct_ep(p, gp, 1), q1);
  1559. lb_emit_store(p, lb_emit_struct_ep(p, gp, 2), q2);
  1560. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), q3);
  1561. return lb_addr_load(p, gen);
  1562. }
  1563. if (is_type_integer(src) && is_type_complex(dst)) {
  1564. Type *ft = base_complex_elem_type(dst);
  1565. lbAddr gen = lb_add_local_generated(p, t, true);
  1566. lbValue gp = lb_addr_get_ptr(p, gen);
  1567. lbValue real = lb_emit_conv(p, value, ft);
  1568. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), real);
  1569. return lb_addr_load(p, gen);
  1570. }
  1571. if (is_type_float(src) && is_type_complex(dst)) {
  1572. Type *ft = base_complex_elem_type(dst);
  1573. lbAddr gen = lb_add_local_generated(p, t, true);
  1574. lbValue gp = lb_addr_get_ptr(p, gen);
  1575. lbValue real = lb_emit_conv(p, value, ft);
  1576. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), real);
  1577. return lb_addr_load(p, gen);
  1578. }
  1579. if (is_type_integer(src) && is_type_quaternion(dst)) {
  1580. Type *ft = base_complex_elem_type(dst);
  1581. lbAddr gen = lb_add_local_generated(p, t, true);
  1582. lbValue gp = lb_addr_get_ptr(p, gen);
  1583. lbValue real = lb_emit_conv(p, value, ft);
  1584. // @QuaternionLayout
  1585. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), real);
  1586. return lb_addr_load(p, gen);
  1587. }
  1588. if (is_type_float(src) && is_type_quaternion(dst)) {
  1589. Type *ft = base_complex_elem_type(dst);
  1590. lbAddr gen = lb_add_local_generated(p, t, true);
  1591. lbValue gp = lb_addr_get_ptr(p, gen);
  1592. lbValue real = lb_emit_conv(p, value, ft);
  1593. // @QuaternionLayout
  1594. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), real);
  1595. return lb_addr_load(p, gen);
  1596. }
  1597. if (is_type_complex(src) && is_type_quaternion(dst)) {
  1598. Type *ft = base_complex_elem_type(dst);
  1599. lbAddr gen = lb_add_local_generated(p, t, true);
  1600. lbValue gp = lb_addr_get_ptr(p, gen);
  1601. lbValue real = lb_emit_conv(p, lb_emit_struct_ev(p, value, 0), ft);
  1602. lbValue imag = lb_emit_conv(p, lb_emit_struct_ev(p, value, 1), ft);
  1603. // @QuaternionLayout
  1604. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), real);
  1605. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), imag);
  1606. return lb_addr_load(p, gen);
  1607. }
  1608. // float <-> integer
  1609. if (is_type_float(src) && is_type_integer(dst)) {
  1610. if (is_type_different_to_arch_endianness(src) || is_type_different_to_arch_endianness(dst)) {
  1611. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1612. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1613. lbValue res = {};
  1614. res = lb_emit_conv(p, value, platform_src_type);
  1615. res = lb_emit_conv(p, res, platform_dst_type);
  1616. return lb_emit_conv(p, res, t);
  1617. }
  1618. if (is_type_integer_128bit(dst)) {
  1619. TEMPORARY_ALLOCATOR_GUARD();
  1620. auto args = array_make<lbValue>(temporary_allocator(), 1);
  1621. args[0] = value;
  1622. char const *call = "fixunsdfdi";
  1623. if (is_type_unsigned(dst)) {
  1624. call = "fixunsdfti";
  1625. }
  1626. lbValue res_i128 = lb_emit_runtime_call(p, call, args);
  1627. return lb_emit_conv(p, res_i128, t);
  1628. }
  1629. i64 sz = type_size_of(src);
  1630. lbValue res = {};
  1631. res.type = t;
  1632. if (is_type_unsigned(dst)) {
  1633. switch (sz) {
  1634. case 2:
  1635. case 4:
  1636. res.value = LLVMBuildFPToUI(p->builder, value.value, lb_type(m, t_u32), "");
  1637. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), false, "");
  1638. break;
  1639. case 8:
  1640. res.value = LLVMBuildFPToUI(p->builder, value.value, lb_type(m, t_u64), "");
  1641. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), false, "");
  1642. break;
  1643. default:
  1644. GB_PANIC("Unhandled float type");
  1645. break;
  1646. }
  1647. } else {
  1648. switch (sz) {
  1649. case 2:
  1650. case 4:
  1651. res.value = LLVMBuildFPToSI(p->builder, value.value, lb_type(m, t_i32), "");
  1652. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), true, "");
  1653. break;
  1654. case 8:
  1655. res.value = LLVMBuildFPToSI(p->builder, value.value, lb_type(m, t_i64), "");
  1656. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), true, "");
  1657. break;
  1658. default:
  1659. GB_PANIC("Unhandled float type");
  1660. break;
  1661. }
  1662. }
  1663. return res;
  1664. }
  1665. if (is_type_integer(src) && is_type_float(dst)) {
  1666. if (is_type_different_to_arch_endianness(src) || is_type_different_to_arch_endianness(dst)) {
  1667. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1668. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1669. lbValue res = {};
  1670. res = lb_emit_conv(p, value, platform_src_type);
  1671. res = lb_emit_conv(p, res, platform_dst_type);
  1672. if (is_type_different_to_arch_endianness(dst)) {
  1673. res = lb_emit_byte_swap(p, res, t);
  1674. }
  1675. return lb_emit_conv(p, res, t);
  1676. }
  1677. if (is_type_integer_128bit(src)) {
  1678. TEMPORARY_ALLOCATOR_GUARD();
  1679. auto args = array_make<lbValue>(temporary_allocator(), 1);
  1680. args[0] = value;
  1681. char const *call = "floattidf";
  1682. if (is_type_unsigned(src)) {
  1683. call = "floattidf_unsigned";
  1684. }
  1685. lbValue res_f64 = lb_emit_runtime_call(p, call, args);
  1686. return lb_emit_conv(p, res_f64, t);
  1687. }
  1688. lbValue res = {};
  1689. res.type = t;
  1690. if (is_type_unsigned(src)) {
  1691. res.value = LLVMBuildUIToFP(p->builder, value.value, lb_type(m, t), "");
  1692. } else {
  1693. res.value = LLVMBuildSIToFP(p->builder, value.value, lb_type(m, t), "");
  1694. }
  1695. return res;
  1696. }
  1697. if (is_type_simd_vector(dst)) {
  1698. Type *et = base_array_type(dst);
  1699. if (is_type_simd_vector(src)) {
  1700. Type *src_elem = core_array_type(src);
  1701. Type *dst_elem = core_array_type(dst);
  1702. GB_ASSERT(src->SimdVector.count == dst->SimdVector.count);
  1703. lbValue res = {};
  1704. res.type = t;
  1705. if (are_types_identical(src_elem, dst_elem)) {
  1706. res.value = value.value;
  1707. } else if (is_type_float(src_elem) && is_type_integer(dst_elem)) {
  1708. if (is_type_unsigned(dst_elem)) {
  1709. res.value = LLVMBuildFPToUI(p->builder, value.value, lb_type(m, t), "");
  1710. } else {
  1711. res.value = LLVMBuildFPToSI(p->builder, value.value, lb_type(m, t), "");
  1712. }
  1713. } else if (is_type_integer(src_elem) && is_type_float(dst_elem)) {
  1714. if (is_type_unsigned(src_elem)) {
  1715. res.value = LLVMBuildUIToFP(p->builder, value.value, lb_type(m, t), "");
  1716. } else {
  1717. res.value = LLVMBuildSIToFP(p->builder, value.value, lb_type(m, t), "");
  1718. }
  1719. } else if ((is_type_integer(src_elem) || is_type_boolean(src_elem)) && is_type_integer(dst_elem)) {
  1720. res.value = LLVMBuildIntCast2(p->builder, value.value, lb_type(m, t), !is_type_unsigned(src_elem), "");
  1721. } else if (is_type_float(src_elem) && is_type_float(dst_elem)) {
  1722. res.value = LLVMBuildFPCast(p->builder, value.value, lb_type(m, t), "");
  1723. } else if (is_type_integer(src_elem) && is_type_boolean(dst_elem)) {
  1724. LLVMValueRef i1vector = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(LLVMTypeOf(value.value)), "");
  1725. res.value = LLVMBuildIntCast2(p->builder, i1vector, lb_type(m, t), !is_type_unsigned(src_elem), "");
  1726. } else if (is_type_pointer(src_elem) && is_type_integer(dst_elem)) {
  1727. res.value = LLVMBuildPtrToInt(p->builder, value.value, lb_type(m, t), "");
  1728. } else if (is_type_integer(src_elem) && is_type_pointer(dst_elem)) {
  1729. res.value = LLVMBuildIntToPtr(p->builder, value.value, lb_type(m, t), "");
  1730. }else {
  1731. GB_PANIC("Unhandled simd vector conversion: %s -> %s", type_to_string(src), type_to_string(dst));
  1732. }
  1733. return res;
  1734. } else {
  1735. i64 count = get_array_type_count(dst);
  1736. LLVMTypeRef vt = lb_type(m, t);
  1737. LLVMTypeRef llvm_u32 = lb_type(m, t_u32);
  1738. LLVMValueRef elem = lb_emit_conv(p, value, et).value;
  1739. LLVMValueRef vector = LLVMConstNull(vt);
  1740. for (i64 i = 0; i < count; i++) {
  1741. LLVMValueRef idx = LLVMConstInt(llvm_u32, i, false);
  1742. vector = LLVMBuildInsertElement(p->builder, vector, elem, idx, "");
  1743. }
  1744. lbValue res = {};
  1745. res.type = t;
  1746. res.value = vector;
  1747. return res;
  1748. }
  1749. }
  1750. // bit_field <-> backing type
  1751. if (is_type_bit_field(src)) {
  1752. if (are_types_identical(src->BitField.backing_type, dst)) {
  1753. lbValue res = {};
  1754. res.type = t;
  1755. res.value = value.value;
  1756. return res;
  1757. }
  1758. }
  1759. if (is_type_bit_field(dst)) {
  1760. if (are_types_identical(src, dst->BitField.backing_type)) {
  1761. lbValue res = {};
  1762. res.type = t;
  1763. res.value = value.value;
  1764. return res;
  1765. }
  1766. }
  1767. // bit_set <-> backing type
  1768. if (is_type_bit_set(src)) {
  1769. Type *backing = bit_set_to_int(src);
  1770. if (are_types_identical(backing, dst)) {
  1771. lbValue res = {};
  1772. res.type = t;
  1773. res.value = value.value;
  1774. return res;
  1775. }
  1776. }
  1777. if (is_type_bit_set(dst)) {
  1778. Type *backing = bit_set_to_int(dst);
  1779. if (are_types_identical(src, backing)) {
  1780. lbValue res = {};
  1781. res.type = t;
  1782. res.value = value.value;
  1783. return res;
  1784. }
  1785. }
  1786. // Pointer <-> uintptr
  1787. if (is_type_pointer(src) && is_type_uintptr(dst)) {
  1788. lbValue res = {};
  1789. res.type = t;
  1790. res.value = LLVMBuildPtrToInt(p->builder, value.value, lb_type(m, t), "");
  1791. return res;
  1792. }
  1793. if (is_type_uintptr(src) && is_type_pointer(dst)) {
  1794. lbValue res = {};
  1795. res.type = t;
  1796. res.value = LLVMBuildIntToPtr(p->builder, value.value, lb_type(m, t), "");
  1797. return res;
  1798. }
  1799. if (is_type_multi_pointer(src) && is_type_uintptr(dst)) {
  1800. lbValue res = {};
  1801. res.type = t;
  1802. res.value = LLVMBuildPtrToInt(p->builder, value.value, lb_type(m, t), "");
  1803. return res;
  1804. }
  1805. if (is_type_uintptr(src) && is_type_multi_pointer(dst)) {
  1806. lbValue res = {};
  1807. res.type = t;
  1808. res.value = LLVMBuildIntToPtr(p->builder, value.value, lb_type(m, t), "");
  1809. return res;
  1810. }
  1811. if (is_type_union(dst)) {
  1812. if (dst->Union.variants.count == 1) {
  1813. Type *vt = dst->Union.variants[0];
  1814. if (internal_check_is_assignable_to(src_type, vt)) {
  1815. value = lb_emit_conv(p, value, vt);
  1816. lbAddr parent = lb_add_local_generated(p, t, true);
  1817. lb_emit_store_union_variant(p, parent.addr, value, vt);
  1818. return lb_addr_load(p, parent);
  1819. }
  1820. }
  1821. for (Type *vt : dst->Union.variants) {
  1822. if (are_types_identical(src_type, vt)) {
  1823. lbAddr parent = lb_add_local_generated(p, t, true);
  1824. lb_emit_store_union_variant(p, parent.addr, value, vt);
  1825. return lb_addr_load(p, parent);
  1826. }
  1827. }
  1828. ValidIndexAndScore *valids = gb_alloc_array(temporary_allocator(), ValidIndexAndScore, dst->Union.variants.count);
  1829. isize valid_count = 0;
  1830. isize first_success_index = -1;
  1831. for_array(i, dst->Union.variants) {
  1832. Type *vt = dst->Union.variants[i];
  1833. i64 score = 0;
  1834. if (internal_check_is_assignable_to(src_type, vt)) {
  1835. valids[valid_count].index = i;
  1836. valids[valid_count].score = score;
  1837. valid_count += 1;
  1838. if (first_success_index < 0) {
  1839. first_success_index = i;
  1840. }
  1841. }
  1842. }
  1843. if (valid_count > 1) {
  1844. gb_sort_array(valids, valid_count, valid_index_and_score_cmp);
  1845. i64 best_score = valids[0].score;
  1846. for (isize i = 1; i < valid_count; i++) {
  1847. auto v = valids[i];
  1848. if (best_score > v.score) {
  1849. valid_count = i;
  1850. break;
  1851. }
  1852. best_score = v.score;
  1853. }
  1854. first_success_index = valids[0].index;
  1855. }
  1856. if (valid_count == 1) {
  1857. Type *vt = dst->Union.variants[first_success_index];
  1858. value = lb_emit_conv(p, value, vt);
  1859. lbAddr parent = lb_add_local_generated(p, t, true);
  1860. lb_emit_store_union_variant(p, parent.addr, value, vt);
  1861. return lb_addr_load(p, parent);
  1862. }
  1863. }
  1864. // NOTE(bill): This has to be done before 'Pointer <-> Pointer' as it's
  1865. // subtype polymorphism casting
  1866. if (check_is_assignable_to_using_subtype(src_type, t)) {
  1867. Type *st = type_deref(src_type);
  1868. st = type_deref(st);
  1869. bool st_is_ptr = is_type_pointer(src_type);
  1870. st = base_type(st);
  1871. Type *dt = t;
  1872. GB_ASSERT(is_type_struct(st) || is_type_raw_union(st));
  1873. Selection sel = {};
  1874. sel.index.allocator = heap_allocator();
  1875. defer (array_free(&sel.index));
  1876. if (lookup_subtype_polymorphic_selection(t, src_type, &sel)) {
  1877. if (sel.entity == nullptr) {
  1878. GB_PANIC("invalid subtype cast %s -> ", type_to_string(src_type), type_to_string(t));
  1879. }
  1880. if (st_is_ptr) {
  1881. lbValue res = lb_emit_deep_field_gep(p, value, sel);
  1882. Type *rt = res.type;
  1883. if (!are_types_identical(rt, dt) && are_types_identical(type_deref(rt), dt)) {
  1884. res = lb_emit_load(p, res);
  1885. }
  1886. return res;
  1887. } else {
  1888. if (is_type_pointer(value.type)) {
  1889. Type *rt = value.type;
  1890. if (!are_types_identical(rt, dt) && are_types_identical(type_deref(rt), dt)) {
  1891. value = lb_emit_load(p, value);
  1892. } else {
  1893. value = lb_emit_deep_field_gep(p, value, sel);
  1894. return lb_emit_load(p, value);
  1895. }
  1896. }
  1897. return lb_emit_deep_field_ev(p, value, sel);
  1898. }
  1899. }
  1900. }
  1901. // Pointer <-> Pointer
  1902. if (is_type_pointer(src) && is_type_pointer(dst)) {
  1903. lbValue res = {};
  1904. res.type = t;
  1905. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1906. return res;
  1907. }
  1908. if (is_type_multi_pointer(src) && is_type_pointer(dst)) {
  1909. lbValue res = {};
  1910. res.type = t;
  1911. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1912. return res;
  1913. }
  1914. if (is_type_pointer(src) && is_type_multi_pointer(dst)) {
  1915. lbValue res = {};
  1916. res.type = t;
  1917. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1918. return res;
  1919. }
  1920. if (is_type_multi_pointer(src) && is_type_multi_pointer(dst)) {
  1921. lbValue res = {};
  1922. res.type = t;
  1923. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1924. return res;
  1925. }
  1926. // proc <-> proc
  1927. if (is_type_proc(src) && is_type_proc(dst)) {
  1928. lbValue res = {};
  1929. res.type = t;
  1930. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1931. return res;
  1932. }
  1933. // pointer -> proc
  1934. if (is_type_pointer(src) && is_type_proc(dst)) {
  1935. lbValue res = {};
  1936. res.type = t;
  1937. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1938. return res;
  1939. }
  1940. // proc -> pointer
  1941. if (is_type_proc(src) && is_type_pointer(dst)) {
  1942. lbValue res = {};
  1943. res.type = t;
  1944. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1945. return res;
  1946. }
  1947. // []byte/[]u8 <-> string
  1948. if (is_type_u8_slice(src) && is_type_string(dst)) {
  1949. return lb_emit_transmute(p, value, t);
  1950. }
  1951. if (is_type_string(src) && is_type_u8_slice(dst)) {
  1952. return lb_emit_transmute(p, value, t);
  1953. }
  1954. if (is_type_array_like(dst)) {
  1955. Type *elem = base_array_type(dst);
  1956. isize index_count = cast(isize)get_array_type_count(dst);
  1957. isize inlineable = type_size_of(dst) <= build_context.max_simd_align;
  1958. lbValue e = lb_emit_conv(p, value, elem);
  1959. if (inlineable && lb_is_const(e)) {
  1960. lbAddr v = {};
  1961. if (e.value) {
  1962. TEMPORARY_ALLOCATOR_GUARD();
  1963. LLVMValueRef *values = gb_alloc_array(temporary_allocator(), LLVMValueRef, index_count);
  1964. for (isize i = 0; i < index_count; i++) {
  1965. values[i] = e.value;
  1966. }
  1967. lbValue array_const_value = {};
  1968. array_const_value.type = t;
  1969. array_const_value.value = LLVMConstArray(lb_type(m, elem), values, cast(unsigned)index_count);
  1970. v = lb_add_global_generated(m, t, array_const_value);
  1971. } else {
  1972. v = lb_add_global_generated(m, t);
  1973. }
  1974. lb_make_global_private_const(v);
  1975. return lb_addr_load(p, v);
  1976. }
  1977. // NOTE(bill): Doesn't need to be zero because it will be initialized in the loops
  1978. lbAddr v = lb_add_local_generated(p, t, false);
  1979. if (!inlineable) {
  1980. auto loop_data = lb_loop_start(p, index_count, t_int);
  1981. lbValue elem = lb_emit_array_ep(p, v.addr, loop_data.idx);
  1982. lb_emit_store(p, elem, e);
  1983. lb_loop_end(p, loop_data);
  1984. } else {
  1985. for (isize i = 0; i < index_count; i++) {
  1986. lbValue elem = lb_emit_array_epi(p, v.addr, i);
  1987. lb_emit_store(p, elem, e);
  1988. }
  1989. }
  1990. return lb_addr_load(p, v);
  1991. }
  1992. if (is_type_matrix(dst) && !is_type_matrix(src)) {
  1993. GB_ASSERT_MSG(dst->Matrix.row_count == dst->Matrix.column_count, "%s <- %s", type_to_string(dst), type_to_string(src));
  1994. Type *elem = base_array_type(dst);
  1995. lbValue e = lb_emit_conv(p, value, elem);
  1996. lbAddr v = lb_add_local_generated(p, t, false);
  1997. lbValue zero = lb_const_value(p->module, elem, exact_value_i64(0), true);
  1998. for (i64 j = 0; j < dst->Matrix.column_count; j++) {
  1999. for (i64 i = 0; i < dst->Matrix.row_count; i++) {
  2000. lbValue ptr = lb_emit_matrix_epi(p, v.addr, i, j);
  2001. lb_emit_store(p, ptr, i == j ? e : zero);
  2002. }
  2003. }
  2004. return lb_addr_load(p, v);
  2005. }
  2006. if (is_type_matrix(dst) && is_type_matrix(src)) {
  2007. GB_ASSERT(dst->kind == Type_Matrix);
  2008. GB_ASSERT(src->kind == Type_Matrix);
  2009. lbAddr v = lb_add_local_generated(p, t, true);
  2010. if (dst->Matrix.row_count == src->Matrix.row_count &&
  2011. dst->Matrix.column_count == src->Matrix.column_count) {
  2012. for (i64 j = 0; j < dst->Matrix.column_count; j++) {
  2013. for (i64 i = 0; i < dst->Matrix.row_count; i++) {
  2014. lbValue d = lb_emit_matrix_epi(p, v.addr, i, j);
  2015. lbValue s = lb_emit_matrix_ev(p, value, i, j);
  2016. s = lb_emit_conv(p, s, dst->Matrix.elem);
  2017. lb_emit_store(p, d, s);
  2018. }
  2019. }
  2020. } else if (is_matrix_square(dst) && is_matrix_square(dst)) {
  2021. for (i64 j = 0; j < dst->Matrix.column_count; j++) {
  2022. for (i64 i = 0; i < dst->Matrix.row_count; i++) {
  2023. if (i < src->Matrix.row_count && j < src->Matrix.column_count) {
  2024. lbValue d = lb_emit_matrix_epi(p, v.addr, i, j);
  2025. lbValue s = lb_emit_matrix_ev(p, value, i, j);
  2026. s = lb_emit_conv(p, s, dst->Matrix.elem);
  2027. lb_emit_store(p, d, s);
  2028. } else if (i == j) {
  2029. lbValue d = lb_emit_matrix_epi(p, v.addr, i, j);
  2030. lbValue s = lb_const_value(p->module, dst->Matrix.elem, exact_value_i64(1), true);
  2031. lb_emit_store(p, d, s);
  2032. }
  2033. }
  2034. }
  2035. } else {
  2036. i64 dst_count = dst->Matrix.row_count*dst->Matrix.column_count;
  2037. i64 src_count = src->Matrix.row_count*src->Matrix.column_count;
  2038. GB_ASSERT(dst_count == src_count);
  2039. lbValue pdst = v.addr;
  2040. lbValue psrc = lb_address_from_load_or_generate_local(p, value);
  2041. bool same_elem_base_types = are_types_identical(
  2042. base_type(dst->Matrix.elem),
  2043. base_type(src->Matrix.elem)
  2044. );
  2045. if (same_elem_base_types && type_size_of(dst) == type_size_of(src)) {
  2046. lb_mem_copy_overlapping(p, v.addr, psrc, lb_const_int(p->module, t_int, type_size_of(dst)));
  2047. } else {
  2048. for (i64 i = 0; i < src_count; i++) {
  2049. lbValue dp = lb_emit_array_epi(p, v.addr, matrix_column_major_index_to_offset(dst, i));
  2050. lbValue sp = lb_emit_array_epi(p, psrc, matrix_column_major_index_to_offset(src, i));
  2051. lbValue s = lb_emit_load(p, sp);
  2052. s = lb_emit_conv(p, s, dst->Matrix.elem);
  2053. lb_emit_store(p, dp, s);
  2054. }
  2055. }
  2056. }
  2057. return lb_addr_load(p, v);
  2058. }
  2059. if (is_type_any(dst)) {
  2060. if (is_type_untyped_uninit(src)) {
  2061. return lb_const_undef(p->module, t);
  2062. }
  2063. if (is_type_untyped_nil(src)) {
  2064. return lb_const_nil(p->module, t);
  2065. }
  2066. lbAddr result = lb_add_local_generated(p, t, true);
  2067. Type *st = default_type(src_type);
  2068. lbValue data = lb_address_from_load_or_generate_local(p, value);
  2069. GB_ASSERT_MSG(is_type_pointer(data.type), "%s", type_to_string(data.type));
  2070. GB_ASSERT_MSG(is_type_typed(st), "%s", type_to_string(st));
  2071. data = lb_emit_conv(p, data, t_rawptr);
  2072. lbValue id = lb_typeid(p->module, st);
  2073. lbValue any_data = lb_emit_struct_ep(p, result.addr, 0);
  2074. lbValue any_id = lb_emit_struct_ep(p, result.addr, 1);
  2075. lb_emit_store(p, any_data, data);
  2076. lb_emit_store(p, any_id, id);
  2077. return lb_addr_load(p, result);
  2078. }
  2079. i64 src_sz = type_size_of(src);
  2080. i64 dst_sz = type_size_of(dst);
  2081. if (src_sz == dst_sz) {
  2082. // bit_set <-> integer
  2083. if (is_type_integer(src) && is_type_bit_set(dst)) {
  2084. lbValue res = lb_emit_conv(p, value, bit_set_to_int(dst));
  2085. res.type = t;
  2086. return res;
  2087. }
  2088. if (is_type_bit_set(src) && is_type_integer(dst)) {
  2089. lbValue bs = value;
  2090. bs.type = bit_set_to_int(src);
  2091. return lb_emit_conv(p, bs, dst);
  2092. }
  2093. // typeid <-> integer
  2094. if (is_type_integer(src) && is_type_typeid(dst)) {
  2095. return lb_emit_transmute(p, value, dst);
  2096. }
  2097. if (is_type_typeid(src) && is_type_integer(dst)) {
  2098. return lb_emit_transmute(p, value, dst);
  2099. }
  2100. }
  2101. if (is_type_untyped(src)) {
  2102. if (is_type_string(src) && is_type_string(dst)) {
  2103. lbAddr result = lb_add_local_generated(p, t, false);
  2104. lb_addr_store(p, result, value);
  2105. return lb_addr_load(p, result);
  2106. }
  2107. }
  2108. gb_printf_err("%.*s\n", LIT(p->name));
  2109. gb_printf_err("lb_emit_conv: src -> dst\n");
  2110. gb_printf_err("Not Identical %s != %s\n", type_to_string(src_type), type_to_string(t));
  2111. gb_printf_err("Not Identical %s != %s\n", type_to_string(src), type_to_string(dst));
  2112. gb_printf_err("Not Identical %p != %p\n", src_type, t);
  2113. gb_printf_err("Not Identical %p != %p\n", src, dst);
  2114. GB_PANIC("Invalid type conversion: '%s' to '%s' for procedure '%.*s'",
  2115. type_to_string(src_type), type_to_string(t),
  2116. LIT(p->name));
  2117. return {};
  2118. }
  2119. gb_internal lbValue lb_emit_c_vararg(lbProcedure *p, lbValue arg, Type *type) {
  2120. Type *core = core_type(type);
  2121. if (core->kind == Type_BitSet) {
  2122. core = core_type(bit_set_to_int(core));
  2123. arg = lb_emit_transmute(p, arg, core);
  2124. }
  2125. Type *promoted = c_vararg_promote_type(core);
  2126. return lb_emit_conv(p, arg, promoted);
  2127. }
  2128. gb_internal lbValue lb_compare_records(lbProcedure *p, TokenKind op_kind, lbValue left, lbValue right, Type *type) {
  2129. GB_ASSERT((is_type_struct(type) || is_type_union(type)) && is_type_comparable(type));
  2130. lbValue left_ptr = lb_address_from_load_or_generate_local(p, left);
  2131. lbValue right_ptr = lb_address_from_load_or_generate_local(p, right);
  2132. lbValue res = {};
  2133. if (type_size_of(type) == 0) {
  2134. switch (op_kind) {
  2135. case Token_CmpEq:
  2136. return lb_const_bool(p->module, t_bool, true);
  2137. case Token_NotEq:
  2138. return lb_const_bool(p->module, t_bool, false);
  2139. }
  2140. GB_PANIC("invalid operator");
  2141. }
  2142. TEMPORARY_ALLOCATOR_GUARD();
  2143. if (is_type_simple_compare(type)) {
  2144. // TODO(bill): Test to see if this is actually faster!!!!
  2145. auto args = array_make<lbValue>(temporary_allocator(), 3);
  2146. args[0] = lb_emit_conv(p, left_ptr, t_rawptr);
  2147. args[1] = lb_emit_conv(p, right_ptr, t_rawptr);
  2148. args[2] = lb_const_int(p->module, t_int, type_size_of(type));
  2149. res = lb_emit_runtime_call(p, "memory_equal", args);
  2150. } else {
  2151. lbValue value = lb_equal_proc_for_type(p->module, type);
  2152. auto args = array_make<lbValue>(temporary_allocator(), 2);
  2153. args[0] = lb_emit_conv(p, left_ptr, t_rawptr);
  2154. args[1] = lb_emit_conv(p, right_ptr, t_rawptr);
  2155. res = lb_emit_call(p, value, args);
  2156. }
  2157. if (op_kind == Token_NotEq) {
  2158. res = lb_emit_unary_arith(p, Token_Not, res, res.type);
  2159. }
  2160. return res;
  2161. }
  2162. gb_internal lbValue lb_emit_comp(lbProcedure *p, TokenKind op_kind, lbValue left, lbValue right) {
  2163. Type *a = core_type(left.type);
  2164. Type *b = core_type(right.type);
  2165. GB_ASSERT(gb_is_between(op_kind, Token__ComparisonBegin+1, Token__ComparisonEnd-1));
  2166. lbValue nil_check = {};
  2167. if (is_type_array_like(left.type) || is_type_array_like(right.type)) {
  2168. // don't do `nil` check if it is array-like
  2169. } else if (is_type_untyped_nil(left.type)) {
  2170. nil_check = lb_emit_comp_against_nil(p, op_kind, right);
  2171. } else if (is_type_untyped_nil(right.type)) {
  2172. nil_check = lb_emit_comp_against_nil(p, op_kind, left);
  2173. }
  2174. if (nil_check.value != nullptr) {
  2175. return nil_check;
  2176. }
  2177. if (are_types_identical(a, b)) {
  2178. // NOTE(bill): No need for a conversion
  2179. } else if ((lb_is_const(left) && !is_type_array(left.type)) || lb_is_const_nil(left)) {
  2180. // NOTE(karl): !is_type_array(left.type) is there to avoid lb_emit_conv
  2181. // trying to convert a constant array into a non-array. In that case we
  2182. // want the `else` branch to happen, so it can try to convert the
  2183. // non-array into an array instead.
  2184. if (lb_is_const_nil(left)) {
  2185. if (internal_check_is_assignable_to(right.type, left.type)) {
  2186. right = lb_emit_conv(p, right, left.type);
  2187. }
  2188. return lb_emit_comp_against_nil(p, op_kind, right);
  2189. }
  2190. left = lb_emit_conv(p, left, right.type);
  2191. } else if ((lb_is_const(right) && !is_type_array(right.type)) || lb_is_const_nil(right)) {
  2192. if (lb_is_const_nil(right)) {
  2193. if (internal_check_is_assignable_to(left.type, right.type)) {
  2194. left = lb_emit_conv(p, left, right.type);
  2195. }
  2196. return lb_emit_comp_against_nil(p, op_kind, left);
  2197. }
  2198. right = lb_emit_conv(p, right, left.type);
  2199. } else {
  2200. Type *lt = left.type;
  2201. Type *rt = right.type;
  2202. lt = left.type;
  2203. rt = right.type;
  2204. i64 ls = type_size_of(lt);
  2205. i64 rs = type_size_of(rt);
  2206. // NOTE(bill): Quick heuristic, larger types are usually the target type
  2207. if (ls < rs) {
  2208. left = lb_emit_conv(p, left, rt);
  2209. } else if (ls > rs) {
  2210. right = lb_emit_conv(p, right, lt);
  2211. } else {
  2212. if (is_type_union(rt)) {
  2213. left = lb_emit_conv(p, left, rt);
  2214. } else {
  2215. right = lb_emit_conv(p, right, lt);
  2216. }
  2217. }
  2218. }
  2219. a = core_type(left.type);
  2220. b = core_type(right.type);
  2221. if (is_type_matrix(a) && (op_kind == Token_CmpEq || op_kind == Token_NotEq)) {
  2222. Type *tl = base_type(a);
  2223. lbValue lhs = lb_address_from_load_or_generate_local(p, left);
  2224. lbValue rhs = lb_address_from_load_or_generate_local(p, right);
  2225. // TODO(bill): Test to see if this is actually faster!!!!
  2226. auto args = array_make<lbValue>(permanent_allocator(), 3);
  2227. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2228. args[1] = lb_emit_conv(p, rhs, t_rawptr);
  2229. args[2] = lb_const_int(p->module, t_int, type_size_of(tl));
  2230. lbValue val = lb_emit_runtime_call(p, "memory_compare", args);
  2231. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_nil(p->module, val.type));
  2232. return lb_emit_conv(p, res, t_bool);
  2233. }
  2234. if (is_type_array_like(a)) {
  2235. Type *tl = base_type(a);
  2236. lbValue lhs = lb_address_from_load_or_generate_local(p, left);
  2237. lbValue rhs = lb_address_from_load_or_generate_local(p, right);
  2238. TokenKind cmp_op = Token_And;
  2239. lbValue res = lb_const_bool(p->module, t_llvm_bool, true);
  2240. if (op_kind == Token_NotEq) {
  2241. res = lb_const_bool(p->module, t_llvm_bool, false);
  2242. cmp_op = Token_Or;
  2243. } else if (op_kind == Token_CmpEq) {
  2244. res = lb_const_bool(p->module, t_llvm_bool, true);
  2245. cmp_op = Token_And;
  2246. }
  2247. bool inline_array_arith = lb_can_try_to_inline_array_arith(tl);
  2248. i32 count = 0;
  2249. switch (tl->kind) {
  2250. case Type_Array: count = cast(i32)tl->Array.count; break;
  2251. case Type_EnumeratedArray: count = cast(i32)tl->EnumeratedArray.count; break;
  2252. }
  2253. if (inline_array_arith) {
  2254. // inline
  2255. lbAddr val = lb_add_local_generated(p, t_bool, false);
  2256. lb_addr_store(p, val, res);
  2257. for (i32 i = 0; i < count; i++) {
  2258. lbValue x = lb_emit_load(p, lb_emit_array_epi(p, lhs, i));
  2259. lbValue y = lb_emit_load(p, lb_emit_array_epi(p, rhs, i));
  2260. lbValue cmp = lb_emit_comp(p, op_kind, x, y);
  2261. lbValue new_res = lb_emit_arith(p, cmp_op, lb_addr_load(p, val), cmp, t_bool);
  2262. lb_addr_store(p, val, lb_emit_conv(p, new_res, t_bool));
  2263. }
  2264. return lb_addr_load(p, val);
  2265. } else {
  2266. if (is_type_simple_compare(tl) && (op_kind == Token_CmpEq || op_kind == Token_NotEq)) {
  2267. // TODO(bill): Test to see if this is actually faster!!!!
  2268. auto args = array_make<lbValue>(permanent_allocator(), 3);
  2269. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2270. args[1] = lb_emit_conv(p, rhs, t_rawptr);
  2271. args[2] = lb_const_int(p->module, t_int, type_size_of(tl));
  2272. lbValue val = lb_emit_runtime_call(p, "memory_compare", args);
  2273. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_nil(p->module, val.type));
  2274. return lb_emit_conv(p, res, t_bool);
  2275. } else {
  2276. lbAddr val = lb_add_local_generated(p, t_bool, false);
  2277. lb_addr_store(p, val, res);
  2278. auto loop_data = lb_loop_start(p, count, t_i32);
  2279. {
  2280. lbValue i = loop_data.idx;
  2281. lbValue x = lb_emit_load(p, lb_emit_array_ep(p, lhs, i));
  2282. lbValue y = lb_emit_load(p, lb_emit_array_ep(p, rhs, i));
  2283. lbValue cmp = lb_emit_comp(p, op_kind, x, y);
  2284. lbValue new_res = lb_emit_arith(p, cmp_op, lb_addr_load(p, val), cmp, t_bool);
  2285. lb_addr_store(p, val, lb_emit_conv(p, new_res, t_bool));
  2286. }
  2287. lb_loop_end(p, loop_data);
  2288. return lb_addr_load(p, val);
  2289. }
  2290. }
  2291. }
  2292. if ((is_type_struct(a) || is_type_union(a)) && is_type_comparable(a)) {
  2293. return lb_compare_records(p, op_kind, left, right, a);
  2294. }
  2295. if ((is_type_struct(b) || is_type_union(b)) && is_type_comparable(b)) {
  2296. return lb_compare_records(p, op_kind, left, right, b);
  2297. }
  2298. if (is_type_string(a)) {
  2299. if (is_type_cstring(a) && is_type_cstring(b)) {
  2300. left = lb_emit_conv(p, left, t_cstring);
  2301. right = lb_emit_conv(p, right, t_cstring);
  2302. char const *runtime_procedure = nullptr;
  2303. switch (op_kind) {
  2304. case Token_CmpEq: runtime_procedure = "cstring_eq"; break;
  2305. case Token_NotEq: runtime_procedure = "cstring_ne"; break;
  2306. case Token_Lt: runtime_procedure = "cstring_lt"; break;
  2307. case Token_Gt: runtime_procedure = "cstring_gt"; break;
  2308. case Token_LtEq: runtime_procedure = "cstring_le"; break;
  2309. case Token_GtEq: runtime_procedure = "cstring_ge"; break;
  2310. }
  2311. GB_ASSERT(runtime_procedure != nullptr);
  2312. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2313. args[0] = left;
  2314. args[1] = right;
  2315. return lb_emit_runtime_call(p, runtime_procedure, args);
  2316. }
  2317. if (is_type_cstring(a) ^ is_type_cstring(b)) {
  2318. left = lb_emit_conv(p, left, t_string);
  2319. right = lb_emit_conv(p, right, t_string);
  2320. }
  2321. char const *runtime_procedure = nullptr;
  2322. switch (op_kind) {
  2323. case Token_CmpEq: runtime_procedure = "string_eq"; break;
  2324. case Token_NotEq: runtime_procedure = "string_ne"; break;
  2325. case Token_Lt: runtime_procedure = "string_lt"; break;
  2326. case Token_Gt: runtime_procedure = "string_gt"; break;
  2327. case Token_LtEq: runtime_procedure = "string_le"; break;
  2328. case Token_GtEq: runtime_procedure = "string_ge"; break;
  2329. }
  2330. GB_ASSERT(runtime_procedure != nullptr);
  2331. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2332. args[0] = left;
  2333. args[1] = right;
  2334. return lb_emit_runtime_call(p, runtime_procedure, args);
  2335. }
  2336. if (is_type_complex(a)) {
  2337. char const *runtime_procedure = "";
  2338. i64 sz = 8*type_size_of(a);
  2339. switch (sz) {
  2340. case 32:
  2341. switch (op_kind) {
  2342. case Token_CmpEq: runtime_procedure = "complex32_eq"; break;
  2343. case Token_NotEq: runtime_procedure = "complex32_ne"; break;
  2344. }
  2345. break;
  2346. case 64:
  2347. switch (op_kind) {
  2348. case Token_CmpEq: runtime_procedure = "complex64_eq"; break;
  2349. case Token_NotEq: runtime_procedure = "complex64_ne"; break;
  2350. }
  2351. break;
  2352. case 128:
  2353. switch (op_kind) {
  2354. case Token_CmpEq: runtime_procedure = "complex128_eq"; break;
  2355. case Token_NotEq: runtime_procedure = "complex128_ne"; break;
  2356. }
  2357. break;
  2358. }
  2359. GB_ASSERT(runtime_procedure != nullptr);
  2360. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2361. args[0] = left;
  2362. args[1] = right;
  2363. return lb_emit_runtime_call(p, runtime_procedure, args);
  2364. }
  2365. if (is_type_quaternion(a)) {
  2366. char const *runtime_procedure = "";
  2367. i64 sz = 8*type_size_of(a);
  2368. switch (sz) {
  2369. case 64:
  2370. switch (op_kind) {
  2371. case Token_CmpEq: runtime_procedure = "quaternion64_eq"; break;
  2372. case Token_NotEq: runtime_procedure = "quaternion64_ne"; break;
  2373. }
  2374. break;
  2375. case 128:
  2376. switch (op_kind) {
  2377. case Token_CmpEq: runtime_procedure = "quaternion128_eq"; break;
  2378. case Token_NotEq: runtime_procedure = "quaternion128_ne"; break;
  2379. }
  2380. break;
  2381. case 256:
  2382. switch (op_kind) {
  2383. case Token_CmpEq: runtime_procedure = "quaternion256_eq"; break;
  2384. case Token_NotEq: runtime_procedure = "quaternion256_ne"; break;
  2385. }
  2386. break;
  2387. }
  2388. GB_ASSERT(runtime_procedure != nullptr);
  2389. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2390. args[0] = left;
  2391. args[1] = right;
  2392. return lb_emit_runtime_call(p, runtime_procedure, args);
  2393. }
  2394. if (is_type_bit_set(a)) {
  2395. switch (op_kind) {
  2396. case Token_Lt:
  2397. case Token_LtEq:
  2398. case Token_Gt:
  2399. case Token_GtEq:
  2400. {
  2401. Type *it = bit_set_to_int(a);
  2402. lbValue lhs = lb_emit_transmute(p, left, it);
  2403. lbValue rhs = lb_emit_transmute(p, right, it);
  2404. if (is_type_different_to_arch_endianness(it)) {
  2405. it = integer_endian_type_to_platform_type(it);
  2406. lhs = lb_emit_byte_swap(p, lhs, it);
  2407. rhs = lb_emit_byte_swap(p, rhs, it);
  2408. }
  2409. lbValue res = lb_emit_arith(p, Token_And, lhs, rhs, it);
  2410. if (op_kind == Token_Lt || op_kind == Token_LtEq) {
  2411. // (lhs & rhs) == lhs
  2412. res.value = LLVMBuildICmp(p->builder, LLVMIntEQ, res.value, lhs.value, "");
  2413. res.type = t_llvm_bool;
  2414. } else if (op_kind == Token_Gt || op_kind == Token_GtEq) {
  2415. // (lhs & rhs) == rhs
  2416. res.value = LLVMBuildICmp(p->builder, LLVMIntEQ, res.value, rhs.value, "");
  2417. res.type = t_llvm_bool;
  2418. }
  2419. // NOTE(bill): Strict subsets
  2420. if (op_kind == Token_Lt || op_kind == Token_Gt) {
  2421. // res &~ (lhs == rhs)
  2422. lbValue eq = {};
  2423. eq.value = LLVMBuildICmp(p->builder, LLVMIntEQ, lhs.value, rhs.value, "");
  2424. eq.type = t_llvm_bool;
  2425. res = lb_emit_arith(p, Token_AndNot, res, eq, t_llvm_bool);
  2426. }
  2427. return res;
  2428. }
  2429. case Token_CmpEq:
  2430. case Token_NotEq:
  2431. {
  2432. LLVMIntPredicate pred = {};
  2433. switch (op_kind) {
  2434. case Token_CmpEq: pred = LLVMIntEQ; break;
  2435. case Token_NotEq: pred = LLVMIntNE; break;
  2436. }
  2437. lbValue res = {};
  2438. res.type = t_llvm_bool;
  2439. res.value = LLVMBuildICmp(p->builder, pred, left.value, right.value, "");
  2440. return res;
  2441. }
  2442. }
  2443. }
  2444. if (op_kind != Token_CmpEq && op_kind != Token_NotEq) {
  2445. Type *t = left.type;
  2446. if (is_type_integer(t) && is_type_different_to_arch_endianness(t)) {
  2447. Type *platform_type = integer_endian_type_to_platform_type(t);
  2448. lbValue x = lb_emit_byte_swap(p, left, platform_type);
  2449. lbValue y = lb_emit_byte_swap(p, right, platform_type);
  2450. left = x;
  2451. right = y;
  2452. } else if (is_type_float(t) && is_type_different_to_arch_endianness(t)) {
  2453. Type *platform_type = integer_endian_type_to_platform_type(t);
  2454. lbValue x = lb_emit_conv(p, left, platform_type);
  2455. lbValue y = lb_emit_conv(p, right, platform_type);
  2456. left = x;
  2457. right = y;
  2458. }
  2459. }
  2460. a = core_type(left.type);
  2461. b = core_type(right.type);
  2462. lbValue res = {};
  2463. res.type = t_llvm_bool;
  2464. if (is_type_integer(a) ||
  2465. is_type_boolean(a) ||
  2466. is_type_pointer(a) ||
  2467. is_type_multi_pointer(a) ||
  2468. is_type_proc(a) ||
  2469. is_type_enum(a)) {
  2470. LLVMIntPredicate pred = {};
  2471. if (is_type_unsigned(left.type)) {
  2472. switch (op_kind) {
  2473. case Token_Gt: pred = LLVMIntUGT; break;
  2474. case Token_GtEq: pred = LLVMIntUGE; break;
  2475. case Token_Lt: pred = LLVMIntULT; break;
  2476. case Token_LtEq: pred = LLVMIntULE; break;
  2477. }
  2478. } else {
  2479. switch (op_kind) {
  2480. case Token_Gt: pred = LLVMIntSGT; break;
  2481. case Token_GtEq: pred = LLVMIntSGE; break;
  2482. case Token_Lt: pred = LLVMIntSLT; break;
  2483. case Token_LtEq: pred = LLVMIntSLE; break;
  2484. }
  2485. }
  2486. switch (op_kind) {
  2487. case Token_CmpEq: pred = LLVMIntEQ; break;
  2488. case Token_NotEq: pred = LLVMIntNE; break;
  2489. }
  2490. LLVMValueRef lhs = left.value;
  2491. LLVMValueRef rhs = right.value;
  2492. if (LLVMTypeOf(lhs) != LLVMTypeOf(rhs)) {
  2493. if (lb_is_type_kind(LLVMTypeOf(lhs), LLVMPointerTypeKind)) {
  2494. rhs = LLVMBuildPointerCast(p->builder, rhs, LLVMTypeOf(lhs), "");
  2495. }
  2496. }
  2497. if (is_type_different_to_arch_endianness(left.type)) {
  2498. Type *pt = integer_endian_type_to_platform_type(left.type);
  2499. lhs = lb_emit_byte_swap(p, {lhs, pt}, pt).value;
  2500. rhs = lb_emit_byte_swap(p, {rhs, pt}, pt).value;
  2501. }
  2502. res.value = LLVMBuildICmp(p->builder, pred, lhs, rhs, "");
  2503. } else if (is_type_float(a)) {
  2504. LLVMRealPredicate pred = {};
  2505. switch (op_kind) {
  2506. case Token_CmpEq: pred = LLVMRealOEQ; break;
  2507. case Token_Gt: pred = LLVMRealOGT; break;
  2508. case Token_GtEq: pred = LLVMRealOGE; break;
  2509. case Token_Lt: pred = LLVMRealOLT; break;
  2510. case Token_LtEq: pred = LLVMRealOLE; break;
  2511. case Token_NotEq: pred = LLVMRealONE; break;
  2512. }
  2513. if (is_type_different_to_arch_endianness(left.type)) {
  2514. Type *pt = integer_endian_type_to_platform_type(left.type);
  2515. left = lb_emit_byte_swap(p, left, pt);
  2516. right = lb_emit_byte_swap(p, right, pt);
  2517. }
  2518. res.value = LLVMBuildFCmp(p->builder, pred, left.value, right.value, "");
  2519. } else if (is_type_typeid(a)) {
  2520. LLVMIntPredicate pred = {};
  2521. switch (op_kind) {
  2522. case Token_Gt: pred = LLVMIntUGT; break;
  2523. case Token_GtEq: pred = LLVMIntUGE; break;
  2524. case Token_Lt: pred = LLVMIntULT; break;
  2525. case Token_LtEq: pred = LLVMIntULE; break;
  2526. case Token_CmpEq: pred = LLVMIntEQ; break;
  2527. case Token_NotEq: pred = LLVMIntNE; break;
  2528. }
  2529. res.value = LLVMBuildICmp(p->builder, pred, left.value, right.value, "");
  2530. } else if (is_type_simd_vector(a)) {
  2531. LLVMValueRef mask = nullptr;
  2532. Type *elem = base_array_type(a);
  2533. if (is_type_float(elem)) {
  2534. LLVMRealPredicate pred = {};
  2535. switch (op_kind) {
  2536. case Token_CmpEq: pred = LLVMRealOEQ; break;
  2537. case Token_NotEq: pred = LLVMRealONE; break;
  2538. }
  2539. mask = LLVMBuildFCmp(p->builder, pred, left.value, right.value, "");
  2540. } else {
  2541. LLVMIntPredicate pred = {};
  2542. switch (op_kind) {
  2543. case Token_CmpEq: pred = LLVMIntEQ; break;
  2544. case Token_NotEq: pred = LLVMIntNE; break;
  2545. }
  2546. mask = LLVMBuildICmp(p->builder, pred, left.value, right.value, "");
  2547. }
  2548. GB_ASSERT_MSG(mask != nullptr, "Unhandled comparison kind %s (%s) %.*s %s (%s)", type_to_string(left.type), type_to_string(base_type(left.type)), LIT(token_strings[op_kind]), type_to_string(right.type), type_to_string(base_type(right.type)));
  2549. /* NOTE(bill, 2022-05-28):
  2550. Thanks to Per Vognsen, sign extending <N x i1> to
  2551. a vector of the same width as the input vector, bit casting to an integer,
  2552. and then comparing against zero is the better option
  2553. See: https://lists.llvm.org/pipermail/llvm-dev/2012-September/053046.html
  2554. // Example assuming 128-bit vector
  2555. %1 = <4 x float> ...
  2556. %2 = <4 x float> ...
  2557. %3 = fcmp oeq <4 x float> %1, %2
  2558. %4 = sext <4 x i1> %3 to <4 x i32>
  2559. %5 = bitcast <4 x i32> %4 to i128
  2560. %6 = icmp ne i128 %5, 0
  2561. br i1 %6, label %true1, label %false2
  2562. This will result in 1 cmpps + 1 ptest + 1 br
  2563. (even without SSE4.1, contrary to what the mail list states, because of pmovmskb)
  2564. */
  2565. unsigned count = cast(unsigned)get_array_type_count(a);
  2566. unsigned elem_sz = cast(unsigned)(type_size_of(elem)*8);
  2567. LLVMTypeRef mask_type = LLVMVectorType(LLVMIntTypeInContext(p->module->ctx, elem_sz), count);
  2568. mask = LLVMBuildSExtOrBitCast(p->builder, mask, mask_type, "");
  2569. LLVMTypeRef mask_int_type = LLVMIntTypeInContext(p->module->ctx, cast(unsigned)(8*type_size_of(a)));
  2570. LLVMValueRef mask_int = LLVMBuildBitCast(p->builder, mask, mask_int_type, "");
  2571. switch (op_kind) {
  2572. case Token_CmpEq:
  2573. res.value = LLVMBuildICmp(p->builder, LLVMIntEQ, mask_int, LLVMConstInt(mask_int_type, U64_MAX, true), "");
  2574. break;
  2575. case Token_NotEq:
  2576. res.value = LLVMBuildICmp(p->builder, LLVMIntNE, mask_int, LLVMConstNull(mask_int_type), "");
  2577. break;
  2578. }
  2579. return res;
  2580. } else {
  2581. GB_PANIC("Unhandled comparison kind %s (%s) %.*s %s (%s)", type_to_string(left.type), type_to_string(base_type(left.type)), LIT(token_strings[op_kind]), type_to_string(right.type), type_to_string(base_type(right.type)));
  2582. }
  2583. return res;
  2584. }
  2585. gb_internal lbValue lb_emit_comp_against_nil(lbProcedure *p, TokenKind op_kind, lbValue x) {
  2586. lbValue res = {};
  2587. res.type = t_llvm_bool;
  2588. Type *t = x.type;
  2589. Type *bt = base_type(t);
  2590. TypeKind type_kind = bt->kind;
  2591. switch (type_kind) {
  2592. case Type_Basic:
  2593. switch (bt->Basic.kind) {
  2594. case Basic_rawptr:
  2595. case Basic_cstring:
  2596. if (op_kind == Token_CmpEq) {
  2597. res.value = LLVMBuildIsNull(p->builder, x.value, "");
  2598. } else if (op_kind == Token_NotEq) {
  2599. res.value = LLVMBuildIsNotNull(p->builder, x.value, "");
  2600. }
  2601. return res;
  2602. case Basic_any:
  2603. {
  2604. // TODO(bill): is this correct behaviour for nil comparison for any?
  2605. lbValue data = lb_emit_struct_ev(p, x, 0);
  2606. lbValue ti = lb_emit_struct_ev(p, x, 1);
  2607. if (op_kind == Token_CmpEq) {
  2608. LLVMValueRef a = LLVMBuildIsNull(p->builder, data.value, "");
  2609. LLVMValueRef b = LLVMBuildIsNull(p->builder, ti.value, "");
  2610. res.value = LLVMBuildOr(p->builder, a, b, "");
  2611. return res;
  2612. } else if (op_kind == Token_NotEq) {
  2613. LLVMValueRef a = LLVMBuildIsNotNull(p->builder, data.value, "");
  2614. LLVMValueRef b = LLVMBuildIsNotNull(p->builder, ti.value, "");
  2615. res.value = LLVMBuildAnd(p->builder, a, b, "");
  2616. return res;
  2617. }
  2618. }
  2619. break;
  2620. case Basic_typeid:
  2621. lbValue invalid_typeid = lb_const_value(p->module, t_typeid, exact_value_i64(0));
  2622. return lb_emit_comp(p, op_kind, x, invalid_typeid);
  2623. }
  2624. break;
  2625. case Type_Enum:
  2626. case Type_Pointer:
  2627. case Type_MultiPointer:
  2628. case Type_Proc:
  2629. if (op_kind == Token_CmpEq) {
  2630. res.value = LLVMBuildIsNull(p->builder, x.value, "");
  2631. } else if (op_kind == Token_NotEq) {
  2632. res.value = LLVMBuildIsNotNull(p->builder, x.value, "");
  2633. }
  2634. return res;
  2635. case Type_BitSet:
  2636. {
  2637. Type *u = bit_set_to_int(bt);
  2638. if (is_type_array(u)) {
  2639. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2640. lbValue lhs = lb_address_from_load_or_generate_local(p, x);
  2641. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2642. args[1] = lb_const_int(p->module, t_int, type_size_of(t));
  2643. lbValue val = lb_emit_runtime_call(p, "memory_compare_zero", args);
  2644. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_int(p->module, t_int, 0));
  2645. return res;
  2646. } else {
  2647. if (op_kind == Token_CmpEq) {
  2648. res.value = LLVMBuildIsNull(p->builder, x.value, "");
  2649. } else if (op_kind == Token_NotEq) {
  2650. res.value = LLVMBuildIsNotNull(p->builder, x.value, "");
  2651. }
  2652. }
  2653. return res;
  2654. }
  2655. case Type_Slice:
  2656. {
  2657. lbValue data = lb_emit_struct_ev(p, x, 0);
  2658. if (op_kind == Token_CmpEq) {
  2659. res.value = LLVMBuildIsNull(p->builder, data.value, "");
  2660. return res;
  2661. } else if (op_kind == Token_NotEq) {
  2662. res.value = LLVMBuildIsNotNull(p->builder, data.value, "");
  2663. return res;
  2664. }
  2665. }
  2666. break;
  2667. case Type_DynamicArray:
  2668. {
  2669. lbValue data = lb_emit_struct_ev(p, x, 0);
  2670. if (op_kind == Token_CmpEq) {
  2671. res.value = LLVMBuildIsNull(p->builder, data.value, "");
  2672. return res;
  2673. } else if (op_kind == Token_NotEq) {
  2674. res.value = LLVMBuildIsNotNull(p->builder, data.value, "");
  2675. return res;
  2676. }
  2677. }
  2678. break;
  2679. case Type_Map:
  2680. {
  2681. lbValue data_ptr = lb_emit_struct_ev(p, x, 0);
  2682. if (op_kind == Token_CmpEq) {
  2683. res.value = LLVMBuildIsNull(p->builder, data_ptr.value, "");
  2684. return res;
  2685. } else {
  2686. res.value = LLVMBuildIsNotNull(p->builder, data_ptr.value, "");
  2687. return res;
  2688. }
  2689. }
  2690. break;
  2691. case Type_Union:
  2692. {
  2693. if (type_size_of(t) == 0) {
  2694. if (op_kind == Token_CmpEq) {
  2695. return lb_const_bool(p->module, t_llvm_bool, true);
  2696. } else if (op_kind == Token_NotEq) {
  2697. return lb_const_bool(p->module, t_llvm_bool, false);
  2698. }
  2699. } else if (is_type_union_maybe_pointer(t)) {
  2700. lbValue tag = lb_emit_transmute(p, x, t_rawptr);
  2701. return lb_emit_comp_against_nil(p, op_kind, tag);
  2702. } else {
  2703. lbValue tag = lb_emit_union_tag_value(p, x);
  2704. return lb_emit_comp(p, op_kind, tag, lb_zero(p->module, tag.type));
  2705. }
  2706. }
  2707. case Type_Struct:
  2708. if (is_type_soa_struct(t)) {
  2709. Type *bt = base_type(t);
  2710. if (bt->Struct.soa_kind == StructSoa_Slice) {
  2711. LLVMValueRef the_value = {};
  2712. if (bt->Struct.fields.count == 0) {
  2713. lbValue len = lb_soa_struct_len(p, x);
  2714. the_value = len.value;
  2715. } else {
  2716. lbValue first_field = lb_emit_struct_ev(p, x, 0);
  2717. the_value = first_field.value;
  2718. }
  2719. if (op_kind == Token_CmpEq) {
  2720. res.value = LLVMBuildIsNull(p->builder, the_value, "");
  2721. return res;
  2722. } else if (op_kind == Token_NotEq) {
  2723. res.value = LLVMBuildIsNotNull(p->builder, the_value, "");
  2724. return res;
  2725. }
  2726. } else if (bt->Struct.soa_kind == StructSoa_Dynamic) {
  2727. LLVMValueRef the_value = {};
  2728. if (bt->Struct.fields.count == 0) {
  2729. lbValue cap = lb_soa_struct_cap(p, x);
  2730. the_value = cap.value;
  2731. } else {
  2732. lbValue first_field = lb_emit_struct_ev(p, x, 0);
  2733. the_value = first_field.value;
  2734. }
  2735. if (op_kind == Token_CmpEq) {
  2736. res.value = LLVMBuildIsNull(p->builder, the_value, "");
  2737. return res;
  2738. } else if (op_kind == Token_NotEq) {
  2739. res.value = LLVMBuildIsNotNull(p->builder, the_value, "");
  2740. return res;
  2741. }
  2742. }
  2743. } else if (is_type_struct(t) && type_has_nil(t)) {
  2744. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2745. lbValue lhs = lb_address_from_load_or_generate_local(p, x);
  2746. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2747. args[1] = lb_const_int(p->module, t_int, type_size_of(t));
  2748. lbValue val = lb_emit_runtime_call(p, "memory_compare_zero", args);
  2749. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_int(p->module, t_int, 0));
  2750. return res;
  2751. }
  2752. break;
  2753. }
  2754. GB_PANIC("Unknown handled type: %s -> %s", type_to_string(t), type_to_string(bt));
  2755. return {};
  2756. }
  2757. gb_internal lbValue lb_build_unary_and(lbProcedure *p, Ast *expr) {
  2758. ast_node(ue, UnaryExpr, expr);
  2759. auto tv = type_and_value_of_expr(expr);
  2760. Ast *ue_expr = unparen_expr(ue->expr);
  2761. if (ue_expr->kind == Ast_IndexExpr && tv.mode == Addressing_OptionalOkPtr && is_type_tuple(tv.type)) {
  2762. Type *tuple = tv.type;
  2763. Type *map_type = type_of_expr(ue_expr->IndexExpr.expr);
  2764. Type *ot = base_type(map_type);
  2765. Type *t = base_type(type_deref(ot));
  2766. bool deref = t != ot;
  2767. GB_ASSERT(t->kind == Type_Map);
  2768. ast_node(ie, IndexExpr, ue_expr);
  2769. lbValue map_val = lb_build_addr_ptr(p, ie->expr);
  2770. if (deref) {
  2771. map_val = lb_emit_load(p, map_val);
  2772. }
  2773. lbValue key = lb_build_expr(p, ie->index);
  2774. key = lb_emit_conv(p, key, t->Map.key);
  2775. lbAddr addr = lb_addr_map(map_val, key, t, alloc_type_pointer(t->Map.value));
  2776. lbValue ptr = lb_addr_get_ptr(p, addr);
  2777. lbValue ok = lb_emit_comp_against_nil(p, Token_NotEq, ptr);
  2778. ok = lb_emit_conv(p, ok, tuple->Tuple.variables[1]->type);
  2779. lbAddr res = lb_add_local_generated(p, tuple, false);
  2780. lbValue gep0 = lb_emit_struct_ep(p, res.addr, 0);
  2781. lbValue gep1 = lb_emit_struct_ep(p, res.addr, 1);
  2782. lb_emit_store(p, gep0, ptr);
  2783. lb_emit_store(p, gep1, ok);
  2784. return lb_addr_load(p, res);
  2785. } else if (is_type_soa_pointer(tv.type)) {
  2786. ast_node(ie, IndexExpr, ue_expr);
  2787. lbValue addr = lb_build_addr_ptr(p, ie->expr);
  2788. if (is_type_pointer(type_deref(addr.type))) {
  2789. addr = lb_emit_load(p, addr);
  2790. }
  2791. GB_ASSERT(is_type_pointer(addr.type));
  2792. lbValue index = lb_build_expr(p, ie->index);
  2793. if (!build_context.no_bounds_check) {
  2794. // TODO(bill): soa bounds checking
  2795. }
  2796. return lb_make_soa_pointer(p, tv.type, addr, index);
  2797. } else if (ue_expr->kind == Ast_CompoundLit) {
  2798. lbValue v = lb_build_expr(p, ue->expr);
  2799. Type *type = v.type;
  2800. lbAddr addr = {};
  2801. if (p->is_startup) {
  2802. addr = lb_add_global_generated(p->module, type, v);
  2803. } else {
  2804. addr = lb_add_local_generated(p, type, false);
  2805. }
  2806. lb_addr_store(p, addr, v);
  2807. return addr.addr;
  2808. } else if (ue_expr->kind == Ast_TypeAssertion) {
  2809. if (is_type_tuple(tv.type)) {
  2810. Type *tuple = tv.type;
  2811. Type *ptr_type = tuple->Tuple.variables[0]->type;
  2812. Type *ok_type = tuple->Tuple.variables[1]->type;
  2813. ast_node(ta, TypeAssertion, ue_expr);
  2814. TokenPos pos = ast_token(expr).pos;
  2815. Type *type = type_of_expr(ue_expr);
  2816. GB_ASSERT(!is_type_tuple(type));
  2817. lbValue e = lb_build_expr(p, ta->expr);
  2818. Type *t = type_deref(e.type);
  2819. if (is_type_union(t)) {
  2820. lbValue v = e;
  2821. if (!is_type_pointer(v.type)) {
  2822. v = lb_address_from_load_or_generate_local(p, v);
  2823. }
  2824. Type *src_type = type_deref(v.type);
  2825. Type *dst_type = type;
  2826. lbValue src_tag = {};
  2827. lbValue dst_tag = {};
  2828. if (is_type_union_maybe_pointer(src_type)) {
  2829. src_tag = lb_emit_comp_against_nil(p, Token_NotEq, v);
  2830. dst_tag = lb_const_bool(p->module, t_bool, true);
  2831. } else {
  2832. src_tag = lb_emit_load(p, lb_emit_union_tag_ptr(p, v));
  2833. dst_tag = lb_const_union_tag(p->module, src_type, dst_type);
  2834. }
  2835. lbValue ok = lb_emit_comp(p, Token_CmpEq, src_tag, dst_tag);
  2836. lbValue data_ptr = lb_emit_conv(p, v, ptr_type);
  2837. lbAddr res = lb_add_local_generated(p, tuple, true);
  2838. lbValue gep0 = lb_emit_struct_ep(p, res.addr, 0);
  2839. lbValue gep1 = lb_emit_struct_ep(p, res.addr, 1);
  2840. lb_emit_store(p, gep0, lb_emit_select(p, ok, data_ptr, lb_const_nil(p->module, ptr_type)));
  2841. lb_emit_store(p, gep1, lb_emit_conv(p, ok, ok_type));
  2842. return lb_addr_load(p, res);
  2843. } else if (is_type_any(t)) {
  2844. lbValue v = e;
  2845. if (is_type_pointer(v.type)) {
  2846. v = lb_emit_load(p, v);
  2847. }
  2848. lbValue data_ptr = lb_emit_conv(p, lb_emit_struct_ev(p, v, 0), ptr_type);
  2849. lbValue any_id = lb_emit_struct_ev(p, v, 1);
  2850. lbValue id = lb_typeid(p->module, type);
  2851. lbValue ok = lb_emit_comp(p, Token_CmpEq, any_id, id);
  2852. lbAddr res = lb_add_local_generated(p, tuple, false);
  2853. lbValue gep0 = lb_emit_struct_ep(p, res.addr, 0);
  2854. lbValue gep1 = lb_emit_struct_ep(p, res.addr, 1);
  2855. lb_emit_store(p, gep0, lb_emit_select(p, ok, data_ptr, lb_const_nil(p->module, ptr_type)));
  2856. lb_emit_store(p, gep1, lb_emit_conv(p, ok, ok_type));
  2857. return lb_addr_load(p, res);
  2858. } else {
  2859. GB_PANIC("TODO(bill): type assertion %s", type_to_string(type));
  2860. }
  2861. } else {
  2862. GB_ASSERT(is_type_pointer(tv.type));
  2863. ast_node(ta, TypeAssertion, ue_expr);
  2864. TokenPos pos = ast_token(expr).pos;
  2865. Type *type = type_of_expr(ue_expr);
  2866. GB_ASSERT(!is_type_tuple(type));
  2867. lbValue e = lb_build_expr(p, ta->expr);
  2868. Type *t = type_deref(e.type);
  2869. if (is_type_union(t)) {
  2870. lbValue v = e;
  2871. if (!is_type_pointer(v.type)) {
  2872. v = lb_address_from_load_or_generate_local(p, v);
  2873. }
  2874. Type *src_type = type_deref(v.type);
  2875. Type *dst_type = type;
  2876. if (!build_context.no_type_assert && (p->state_flags & StateFlag_no_type_assert) == 0) {
  2877. lbValue src_tag = {};
  2878. lbValue dst_tag = {};
  2879. if (is_type_union_maybe_pointer(src_type)) {
  2880. src_tag = lb_emit_comp_against_nil(p, Token_NotEq, v);
  2881. dst_tag = lb_const_bool(p->module, t_bool, true);
  2882. } else {
  2883. src_tag = lb_emit_load(p, lb_emit_union_tag_ptr(p, v));
  2884. dst_tag = lb_const_union_tag(p->module, src_type, dst_type);
  2885. }
  2886. isize arg_count = 6;
  2887. if (build_context.no_rtti) {
  2888. arg_count = 4;
  2889. }
  2890. lbValue ok = lb_emit_comp(p, Token_CmpEq, src_tag, dst_tag);
  2891. auto args = array_make<lbValue>(permanent_allocator(), arg_count);
  2892. args[0] = ok;
  2893. lb_set_file_line_col(p, array_slice(args, 1, args.count), pos);
  2894. if (!build_context.no_rtti) {
  2895. args[4] = lb_typeid(p->module, src_type);
  2896. args[5] = lb_typeid(p->module, dst_type);
  2897. }
  2898. lb_emit_runtime_call(p, "type_assertion_check", args);
  2899. }
  2900. lbValue data_ptr = v;
  2901. return lb_emit_conv(p, data_ptr, tv.type);
  2902. } else if (is_type_any(t)) {
  2903. lbValue v = e;
  2904. if (is_type_pointer(v.type)) {
  2905. v = lb_emit_load(p, v);
  2906. }
  2907. lbValue data_ptr = lb_emit_struct_ev(p, v, 0);
  2908. if (!build_context.no_type_assert && (p->state_flags & StateFlag_no_type_assert) == 0) {
  2909. GB_ASSERT(!build_context.no_rtti);
  2910. lbValue any_id = lb_emit_struct_ev(p, v, 1);
  2911. lbValue id = lb_typeid(p->module, type);
  2912. lbValue ok = lb_emit_comp(p, Token_CmpEq, any_id, id);
  2913. auto args = array_make<lbValue>(permanent_allocator(), 6);
  2914. args[0] = ok;
  2915. lb_set_file_line_col(p, array_slice(args, 1, args.count), pos);
  2916. args[4] = any_id;
  2917. args[5] = id;
  2918. lb_emit_runtime_call(p, "type_assertion_check", args);
  2919. }
  2920. return lb_emit_conv(p, data_ptr, tv.type);
  2921. } else {
  2922. GB_PANIC("TODO(bill): type assertion %s", type_to_string(type));
  2923. }
  2924. }
  2925. }
  2926. return lb_build_addr_ptr(p, ue->expr);
  2927. }
  2928. gb_internal lbValue lb_build_expr_internal(lbProcedure *p, Ast *expr);
  2929. gb_internal lbValue lb_build_expr(lbProcedure *p, Ast *expr) {
  2930. u16 prev_state_flags = p->state_flags;
  2931. defer (p->state_flags = prev_state_flags);
  2932. if (expr->state_flags != 0) {
  2933. u16 in = expr->state_flags;
  2934. u16 out = p->state_flags;
  2935. if (in & StateFlag_bounds_check) {
  2936. out |= StateFlag_bounds_check;
  2937. out &= ~StateFlag_no_bounds_check;
  2938. } else if (in & StateFlag_no_bounds_check) {
  2939. out |= StateFlag_no_bounds_check;
  2940. out &= ~StateFlag_bounds_check;
  2941. }
  2942. if (in & StateFlag_type_assert) {
  2943. out |= StateFlag_type_assert;
  2944. out &= ~StateFlag_no_type_assert;
  2945. } else if (in & StateFlag_no_type_assert) {
  2946. out |= StateFlag_no_type_assert;
  2947. out &= ~StateFlag_type_assert;
  2948. }
  2949. p->state_flags = out;
  2950. }
  2951. // IMPORTANT NOTE(bill):
  2952. // Selector Call Expressions (foo->bar(...))
  2953. // must only evaluate `foo` once as it gets transformed into
  2954. // `foo.bar(foo, ...)`
  2955. // And if `foo` is a procedure call or something more complex, storing the value
  2956. // once is a very good idea
  2957. // If a stored value is found, it must be removed from the cache
  2958. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  2959. lbValue *pp = map_get(&p->selector_values, expr);
  2960. if (pp != nullptr) {
  2961. lbValue res = *pp;
  2962. map_remove(&p->selector_values, expr);
  2963. return res;
  2964. }
  2965. lbAddr *pa = map_get(&p->selector_addr, expr);
  2966. if (pa != nullptr) {
  2967. lbAddr res = *pa;
  2968. map_remove(&p->selector_addr, expr);
  2969. return lb_addr_load(p, res);
  2970. }
  2971. }
  2972. lbValue res = lb_build_expr_internal(p, expr);
  2973. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  2974. map_set(&p->selector_values, expr, res);
  2975. }
  2976. return res;
  2977. }
  2978. gb_internal lbValue lb_build_expr_internal(lbProcedure *p, Ast *expr) {
  2979. lbModule *m = p->module;
  2980. expr = unparen_expr(expr);
  2981. TokenPos expr_pos = ast_token(expr).pos;
  2982. TypeAndValue tv = type_and_value_of_expr(expr);
  2983. Type *type = type_of_expr(expr);
  2984. GB_ASSERT_MSG(tv.mode != Addressing_Invalid, "invalid expression '%s' (tv.mode = %d, tv.type = %s) @ %s\n Current Proc: %.*s : %s", expr_to_string(expr), tv.mode, type_to_string(tv.type), token_pos_to_string(expr_pos), LIT(p->name), type_to_string(p->type));
  2985. if (tv.value.kind != ExactValue_Invalid) {
  2986. // NOTE(bill): Short on constant values
  2987. return lb_const_value(p->module, type, tv.value);
  2988. } else if (tv.mode == Addressing_Type) {
  2989. // NOTE(bill, 2023-01-16): is this correct? I hope so at least
  2990. return lb_typeid(m, tv.type);
  2991. }
  2992. switch (expr->kind) {
  2993. case_ast_node(bl, BasicLit, expr);
  2994. if (type != nullptr && type->Named.name == "Error") {
  2995. Entity *e = type->Named.type_name;
  2996. if (e->pkg && e->pkg->name == "os") {
  2997. return lb_const_nil(p->module, type);
  2998. }
  2999. }
  3000. TokenPos pos = bl->token.pos;
  3001. GB_PANIC("Non-constant basic literal %s - %.*s (%s)", token_pos_to_string(pos), LIT(token_strings[bl->token.kind]), type_to_string(type));
  3002. case_end;
  3003. case_ast_node(bd, BasicDirective, expr);
  3004. TokenPos pos = bd->token.pos;
  3005. String name = bd->name.string;
  3006. if (name == "branch_location") {
  3007. GB_ASSERT(p->uses_branch_location);
  3008. String proc_name = p->entity->token.string;
  3009. return lb_emit_source_code_location_as_global(p, proc_name, p->branch_location_pos);
  3010. }
  3011. GB_PANIC("Non-constant basic literal %s - %.*s", token_pos_to_string(pos), LIT(name));
  3012. case_end;
  3013. case_ast_node(i, Implicit, expr);
  3014. return lb_addr_load(p, lb_build_addr(p, expr));
  3015. case_end;
  3016. case_ast_node(u, Uninit, expr)
  3017. lbValue res = {};
  3018. if (is_type_untyped(type)) {
  3019. res.value = nullptr;
  3020. res.type = t_untyped_uninit;
  3021. } else {
  3022. res.value = LLVMGetUndef(lb_type(m, type));
  3023. res.type = type;
  3024. }
  3025. return res;
  3026. case_end;
  3027. case_ast_node(i, Ident, expr);
  3028. Entity *e = entity_from_expr(expr);
  3029. e = strip_entity_wrapping(e);
  3030. GB_ASSERT_MSG(e != nullptr, "%s in %.*s %p", expr_to_string(expr), LIT(p->name), expr);
  3031. if (e->kind == Entity_Builtin) {
  3032. Token token = ast_token(expr);
  3033. GB_PANIC("TODO(bill): lb_build_expr Entity_Builtin '%.*s'\n"
  3034. "\t at %s", LIT(builtin_procs[e->Builtin.id].name),
  3035. token_pos_to_string(token.pos));
  3036. return {};
  3037. } else if (e->kind == Entity_Nil) {
  3038. lbValue res = {};
  3039. res.value = nullptr;
  3040. res.type = e->type;
  3041. return res;
  3042. }
  3043. GB_ASSERT(e->kind != Entity_ProcGroup);
  3044. return lb_find_ident(p, m, e, expr);
  3045. case_end;
  3046. case_ast_node(de, DerefExpr, expr);
  3047. return lb_addr_load(p, lb_build_addr(p, expr));
  3048. case_end;
  3049. case_ast_node(se, SelectorExpr, expr);
  3050. TypeAndValue tav = type_and_value_of_expr(expr);
  3051. GB_ASSERT(tav.mode != Addressing_Invalid);
  3052. return lb_addr_load(p, lb_build_addr(p, expr));
  3053. case_end;
  3054. case_ast_node(ise, ImplicitSelectorExpr, expr);
  3055. TypeAndValue tav = type_and_value_of_expr(expr);
  3056. GB_ASSERT(tav.mode == Addressing_Constant);
  3057. return lb_const_value(p->module, type, tv.value);
  3058. case_end;
  3059. case_ast_node(se, SelectorCallExpr, expr);
  3060. GB_ASSERT(se->modified_call);
  3061. return lb_build_call_expr(p, se->call);
  3062. case_end;
  3063. case_ast_node(te, TernaryIfExpr, expr);
  3064. LLVMValueRef incoming_values[2] = {};
  3065. LLVMBasicBlockRef incoming_blocks[2] = {};
  3066. GB_ASSERT(te->y != nullptr);
  3067. lbBlock *then = lb_create_block(p, "if.then");
  3068. lbBlock *done = lb_create_block(p, "if.done"); // NOTE(bill): Append later
  3069. lbBlock *else_ = lb_create_block(p, "if.else");
  3070. lb_build_cond(p, te->cond, then, else_);
  3071. lb_start_block(p, then);
  3072. Type *type = default_type(type_of_expr(expr));
  3073. LLVMTypeRef llvm_type = lb_type(p->module, type);
  3074. incoming_values[0] = lb_emit_conv(p, lb_build_expr(p, te->x), type).value;
  3075. if (is_type_internally_pointer_like(type)) {
  3076. incoming_values[0] = LLVMBuildBitCast(p->builder, incoming_values[0], llvm_type, "");
  3077. }
  3078. lb_emit_jump(p, done);
  3079. lb_start_block(p, else_);
  3080. incoming_values[1] = lb_emit_conv(p, lb_build_expr(p, te->y), type).value;
  3081. if (is_type_internally_pointer_like(type)) {
  3082. incoming_values[1] = LLVMBuildBitCast(p->builder, incoming_values[1], llvm_type, "");
  3083. }
  3084. lb_emit_jump(p, done);
  3085. lb_start_block(p, done);
  3086. lbValue res = {};
  3087. res.value = LLVMBuildPhi(p->builder, llvm_type, "");
  3088. res.type = type;
  3089. GB_ASSERT(p->curr_block->preds.count >= 2);
  3090. incoming_blocks[0] = p->curr_block->preds[0]->block;
  3091. incoming_blocks[1] = p->curr_block->preds[1]->block;
  3092. LLVMAddIncoming(res.value, incoming_values, incoming_blocks, 2);
  3093. return res;
  3094. case_end;
  3095. case_ast_node(te, TernaryWhenExpr, expr);
  3096. TypeAndValue tav = type_and_value_of_expr(te->cond);
  3097. GB_ASSERT(tav.mode == Addressing_Constant);
  3098. GB_ASSERT(tav.value.kind == ExactValue_Bool);
  3099. if (tav.value.value_bool) {
  3100. return lb_build_expr(p, te->x);
  3101. } else {
  3102. return lb_build_expr(p, te->y);
  3103. }
  3104. case_end;
  3105. case_ast_node(oe, OrElseExpr, expr);
  3106. return lb_emit_or_else(p, oe->x, oe->y, tv);
  3107. case_end;
  3108. case_ast_node(oe, OrReturnExpr, expr);
  3109. return lb_emit_or_return(p, oe->expr, tv);
  3110. case_end;
  3111. case_ast_node(be, OrBranchExpr, expr);
  3112. lbBlock *block = nullptr;
  3113. if (be->label != nullptr) {
  3114. lbBranchBlocks bb = lb_lookup_branch_blocks(p, be->label);
  3115. switch (be->token.kind) {
  3116. case Token_or_break: block = bb.break_; break;
  3117. case Token_or_continue: block = bb.continue_; break;
  3118. }
  3119. } else {
  3120. for (lbTargetList *t = p->target_list; t != nullptr && block == nullptr; t = t->prev) {
  3121. if (t->is_block) {
  3122. continue;
  3123. }
  3124. switch (be->token.kind) {
  3125. case Token_or_break: block = t->break_; break;
  3126. case Token_or_continue: block = t->continue_; break;
  3127. }
  3128. }
  3129. }
  3130. GB_ASSERT(block != nullptr);
  3131. lbValue lhs = {};
  3132. lbValue rhs = {};
  3133. lb_emit_try_lhs_rhs(p, be->expr, tv, &lhs, &rhs);
  3134. Type *type = default_type(tv.type);
  3135. if (lhs.value) {
  3136. lhs = lb_emit_conv(p, lhs, type);
  3137. } else if (type != nullptr && type != t_invalid) {
  3138. lhs = lb_const_nil(p->module, type);
  3139. }
  3140. lbBlock *then = lb_create_block(p, "or_branch.then");
  3141. lbBlock *else_ = lb_create_block(p, "or_branch.else");
  3142. lb_emit_if(p, lb_emit_try_has_value(p, rhs), then, else_);
  3143. lb_start_block(p, else_);
  3144. lb_emit_defer_stmts(p, lbDeferExit_Branch, block, expr);
  3145. lb_emit_jump(p, block);
  3146. lb_start_block(p, then);
  3147. return lhs;
  3148. case_end;
  3149. case_ast_node(ta, TypeAssertion, expr);
  3150. TokenPos pos = ast_token(expr).pos;
  3151. lbValue e = lb_build_expr(p, ta->expr);
  3152. Type *t = type_deref(e.type);
  3153. if (is_type_union(t)) {
  3154. if (ta->ignores[0]) {
  3155. // NOTE(bill): This is not needed for optimization levels other than 0
  3156. return lb_emit_union_cast_only_ok_check(p, e, type, pos);
  3157. }
  3158. return lb_emit_union_cast(p, e, type, pos);
  3159. } else if (is_type_any(t)) {
  3160. return lb_emit_any_cast(p, e, type, pos);
  3161. } else {
  3162. GB_PANIC("TODO(bill): type assertion %s", type_to_string(e.type));
  3163. }
  3164. case_end;
  3165. case_ast_node(tc, TypeCast, expr);
  3166. lbValue e = lb_build_expr(p, tc->expr);
  3167. switch (tc->token.kind) {
  3168. case Token_cast:
  3169. return lb_emit_conv(p, e, type);
  3170. case Token_transmute:
  3171. return lb_emit_transmute(p, e, type);
  3172. }
  3173. GB_PANIC("Invalid AST TypeCast");
  3174. case_end;
  3175. case_ast_node(ac, AutoCast, expr);
  3176. lbValue value = lb_build_expr(p, ac->expr);
  3177. return lb_emit_conv(p, value, type);
  3178. case_end;
  3179. case_ast_node(ue, UnaryExpr, expr);
  3180. switch (ue->op.kind) {
  3181. case Token_And:
  3182. return lb_build_unary_and(p, expr);
  3183. default:
  3184. {
  3185. lbValue v = lb_build_expr(p, ue->expr);
  3186. return lb_emit_unary_arith(p, ue->op.kind, v, type);
  3187. }
  3188. }
  3189. case_end;
  3190. case_ast_node(be, BinaryExpr, expr);
  3191. return lb_build_binary_expr(p, expr);
  3192. case_end;
  3193. case_ast_node(pl, ProcLit, expr);
  3194. return lb_generate_anonymous_proc_lit(p->module, p->name, expr, p);
  3195. case_end;
  3196. case_ast_node(cl, CompoundLit, expr);
  3197. return lb_addr_load(p, lb_build_addr(p, expr));
  3198. case_end;
  3199. case_ast_node(ce, CallExpr, expr);
  3200. return lb_build_call_expr(p, expr);
  3201. case_end;
  3202. case_ast_node(se, SliceExpr, expr);
  3203. if (is_type_slice(type_of_expr(se->expr))) {
  3204. // NOTE(bill): Quick optimization
  3205. if (se->high == nullptr &&
  3206. (se->low == nullptr || lb_is_expr_constant_zero(se->low))) {
  3207. return lb_build_expr(p, se->expr);
  3208. }
  3209. }
  3210. return lb_addr_load(p, lb_build_addr(p, expr));
  3211. case_end;
  3212. case_ast_node(ie, IndexExpr, expr);
  3213. return lb_addr_load(p, lb_build_addr(p, expr));
  3214. case_end;
  3215. case_ast_node(ie, MatrixIndexExpr, expr);
  3216. return lb_addr_load(p, lb_build_addr(p, expr));
  3217. case_end;
  3218. case_ast_node(ia, InlineAsmExpr, expr);
  3219. Type *t = type_of_expr(expr);
  3220. GB_ASSERT(is_type_asm_proc(t));
  3221. String asm_string = {};
  3222. String constraints_string = {};
  3223. TypeAndValue tav;
  3224. tav = type_and_value_of_expr(ia->asm_string);
  3225. GB_ASSERT(is_type_string(tav.type));
  3226. GB_ASSERT(tav.value.kind == ExactValue_String);
  3227. asm_string = tav.value.value_string;
  3228. tav = type_and_value_of_expr(ia->constraints_string);
  3229. GB_ASSERT(is_type_string(tav.type));
  3230. GB_ASSERT(tav.value.kind == ExactValue_String);
  3231. constraints_string = tav.value.value_string;
  3232. LLVMInlineAsmDialect dialect = LLVMInlineAsmDialectATT;
  3233. switch (ia->dialect) {
  3234. case InlineAsmDialect_Default: dialect = LLVMInlineAsmDialectATT; break;
  3235. case InlineAsmDialect_ATT: dialect = LLVMInlineAsmDialectATT; break;
  3236. case InlineAsmDialect_Intel: dialect = LLVMInlineAsmDialectIntel; break;
  3237. default: GB_PANIC("Unhandled inline asm dialect"); break;
  3238. }
  3239. LLVMTypeRef func_type = lb_type_internal_for_procedures_raw(p->module, t);
  3240. LLVMValueRef the_asm = llvm_get_inline_asm(func_type, asm_string, constraints_string, ia->has_side_effects, ia->has_side_effects, dialect);
  3241. GB_ASSERT(the_asm != nullptr);
  3242. return {the_asm, t};
  3243. case_end;
  3244. }
  3245. GB_PANIC("lb_build_expr: %.*s", LIT(ast_strings[expr->kind]));
  3246. return {};
  3247. }
  3248. gb_internal lbAddr lb_get_soa_variable_addr(lbProcedure *p, Entity *e) {
  3249. return map_must_get(&p->module->soa_values, e);
  3250. }
  3251. gb_internal lbValue lb_get_using_variable(lbProcedure *p, Entity *e) {
  3252. GB_ASSERT(e->kind == Entity_Variable && e->flags & EntityFlag_Using);
  3253. String name = e->token.string;
  3254. Entity *parent = e->using_parent;
  3255. Selection sel = lookup_field(parent->type, name, false);
  3256. GB_ASSERT(sel.entity != nullptr);
  3257. lbValue *pv = map_get(&p->module->values, parent);
  3258. lbValue v = {};
  3259. bool is_soa = false;
  3260. if (pv == nullptr && parent->flags & EntityFlag_SoaPtrField) {
  3261. is_soa = true;
  3262. // NOTE(bill): using SOA value (probably from for-in statement)
  3263. lbAddr parent_addr = lb_get_soa_variable_addr(p, parent);
  3264. v = lb_addr_get_ptr(p, parent_addr);
  3265. } else if (pv != nullptr) {
  3266. v = *pv;
  3267. } else {
  3268. GB_ASSERT_MSG(e->using_expr != nullptr, "%.*s", LIT(name));
  3269. v = lb_build_addr_ptr(p, e->using_expr);
  3270. }
  3271. GB_ASSERT(v.value != nullptr);
  3272. GB_ASSERT_MSG(is_soa || parent->type == type_deref(v.type), "%s %s", type_to_string(parent->type), type_to_string(v.type));
  3273. lbValue ptr = lb_emit_deep_field_gep(p, v, sel);
  3274. if (parent->scope) {
  3275. if ((parent->scope->flags & (ScopeFlag_File|ScopeFlag_Pkg)) == 0) {
  3276. lb_add_debug_local_variable(p, ptr.value, e->type, e->token);
  3277. }
  3278. } else {
  3279. lb_add_debug_local_variable(p, ptr.value, e->type, e->token);
  3280. }
  3281. return ptr;
  3282. }
  3283. gb_internal lbAddr lb_build_addr_from_entity(lbProcedure *p, Entity *e, Ast *expr) {
  3284. GB_ASSERT(e != nullptr);
  3285. if (e->kind == Entity_Constant) {
  3286. Type *t = default_type(type_of_expr(expr));
  3287. lbValue v = lb_const_value(p->module, t, e->Constant.value);
  3288. if (LLVMIsConstant(v.value)) {
  3289. lbAddr g = lb_add_global_generated(p->module, t, v);
  3290. return g;
  3291. }
  3292. GB_ASSERT(LLVMIsALoadInst(v.value));
  3293. lbValue ptr = {};
  3294. ptr.value = LLVMGetOperand(v.value, 0);
  3295. ptr.type = alloc_type_pointer(t);
  3296. return lb_addr(ptr);
  3297. }
  3298. lbValue v = {};
  3299. lbValue *found = map_get(&p->module->values, e);
  3300. if (found) {
  3301. v = *found;
  3302. } else if (e->kind == Entity_Variable && e->flags & EntityFlag_Using) {
  3303. // NOTE(bill): Calculate the using variable every time
  3304. v = lb_get_using_variable(p, e);
  3305. } else if (e->flags & EntityFlag_SoaPtrField) {
  3306. return lb_get_soa_variable_addr(p, e);
  3307. }
  3308. if (v.value == nullptr) {
  3309. return lb_addr(lb_find_value_from_entity(p->module, e));
  3310. // error(expr, "%.*s Unknown value: %.*s, entity: %p %.*s",
  3311. // LIT(p->name),
  3312. // LIT(e->token.string), e, LIT(entity_strings[e->kind]));
  3313. // GB_PANIC("Unknown value");
  3314. }
  3315. return lb_addr(v);
  3316. }
  3317. gb_internal lbAddr lb_build_array_swizzle_addr(lbProcedure *p, AstCallExpr *ce, TypeAndValue const &tv) {
  3318. isize index_count = ce->args.count-1;
  3319. lbAddr addr = lb_build_addr(p, ce->args[0]);
  3320. if (index_count == 0) {
  3321. return addr;
  3322. }
  3323. Type *type = base_type(lb_addr_type(addr));
  3324. GB_ASSERT(type->kind == Type_Array);
  3325. i64 count = type->Array.count;
  3326. if (count <= 4 && index_count <= 4) {
  3327. u8 indices[4] = {};
  3328. u8 index_count = 0;
  3329. for (i32 i = 1; i < ce->args.count; i++) {
  3330. TypeAndValue tv = type_and_value_of_expr(ce->args[i]);
  3331. GB_ASSERT(is_type_integer(tv.type));
  3332. GB_ASSERT(tv.value.kind == ExactValue_Integer);
  3333. i64 src_index = big_int_to_i64(&tv.value.value_integer);
  3334. indices[index_count++] = cast(u8)src_index;
  3335. }
  3336. return lb_addr_swizzle(lb_addr_get_ptr(p, addr), tv.type, index_count, indices);
  3337. }
  3338. auto indices = slice_make<i32>(permanent_allocator(), ce->args.count-1);
  3339. isize index_index = 0;
  3340. for (i32 i = 1; i < ce->args.count; i++) {
  3341. TypeAndValue tv = type_and_value_of_expr(ce->args[i]);
  3342. GB_ASSERT(is_type_integer(tv.type));
  3343. GB_ASSERT(tv.value.kind == ExactValue_Integer);
  3344. i64 src_index = big_int_to_i64(&tv.value.value_integer);
  3345. indices[index_index++] = cast(i32)src_index;
  3346. }
  3347. return lb_addr_swizzle_large(lb_addr_get_ptr(p, addr), tv.type, indices);
  3348. }
  3349. gb_internal lbAddr lb_build_addr_internal(lbProcedure *p, Ast *expr);
  3350. gb_internal lbAddr lb_build_addr(lbProcedure *p, Ast *expr) {
  3351. expr = unparen_expr(expr);
  3352. // IMPORTANT NOTE(bill):
  3353. // Selector Call Expressions (foo->bar(...))
  3354. // must only evaluate `foo` once as it gets transformed into
  3355. // `foo.bar(foo, ...)`
  3356. // And if `foo` is a procedure call or something more complex, storing the value
  3357. // once is a very good idea
  3358. // If a stored value is found, it must be removed from the cache
  3359. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  3360. lbAddr *pp = map_get(&p->selector_addr, expr);
  3361. if (pp != nullptr) {
  3362. lbAddr res = *pp;
  3363. map_remove(&p->selector_addr, expr);
  3364. return res;
  3365. }
  3366. }
  3367. lbAddr addr = lb_build_addr_internal(p, expr);
  3368. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  3369. map_set(&p->selector_addr, expr, addr);
  3370. }
  3371. return addr;
  3372. }
  3373. gb_internal void lb_build_addr_compound_lit_populate(lbProcedure *p, Slice<Ast *> const &elems, Array<lbCompoundLitElemTempData> *temp_data, Type *compound_type) {
  3374. Type *bt = base_type(compound_type);
  3375. Type *et = nullptr;
  3376. switch (bt->kind) {
  3377. case Type_Array: et = bt->Array.elem; break;
  3378. case Type_EnumeratedArray: et = bt->EnumeratedArray.elem; break;
  3379. case Type_Slice: et = bt->Slice.elem; break;
  3380. case Type_BitSet: et = bt->BitSet.elem; break;
  3381. case Type_DynamicArray: et = bt->DynamicArray.elem; break;
  3382. case Type_SimdVector: et = bt->SimdVector.elem; break;
  3383. case Type_Matrix: et = bt->Matrix.elem; break;
  3384. }
  3385. GB_ASSERT(et != nullptr);
  3386. // NOTE(bill): Separate value, gep, store into their own chunks
  3387. for_array(i, elems) {
  3388. Ast *elem = elems[i];
  3389. if (elem->kind == Ast_FieldValue) {
  3390. ast_node(fv, FieldValue, elem);
  3391. if (bt->kind != Type_DynamicArray && lb_is_elem_const(fv->value, et)) {
  3392. continue;
  3393. }
  3394. if (is_ast_range(fv->field)) {
  3395. ast_node(ie, BinaryExpr, fv->field);
  3396. TypeAndValue lo_tav = ie->left->tav;
  3397. TypeAndValue hi_tav = ie->right->tav;
  3398. GB_ASSERT(lo_tav.mode == Addressing_Constant);
  3399. GB_ASSERT(hi_tav.mode == Addressing_Constant);
  3400. TokenKind op = ie->op.kind;
  3401. i64 lo = exact_value_to_i64(lo_tav.value);
  3402. i64 hi = exact_value_to_i64(hi_tav.value);
  3403. if (op != Token_RangeHalf) {
  3404. hi += 1;
  3405. }
  3406. lbValue value = lb_emit_conv(p, lb_build_expr(p, fv->value), et);
  3407. GB_ASSERT((hi-lo) > 0);
  3408. if (bt->kind == Type_Matrix) {
  3409. for (i64 k = lo; k < hi; k++) {
  3410. lbCompoundLitElemTempData data = {};
  3411. data.value = value;
  3412. data.elem_index = matrix_row_major_index_to_offset(bt, k);
  3413. array_add(temp_data, data);
  3414. }
  3415. } else {
  3416. enum {MAX_ELEMENT_AMOUNT = 32};
  3417. if ((hi-lo) <= MAX_ELEMENT_AMOUNT) {
  3418. for (i64 k = lo; k < hi; k++) {
  3419. lbCompoundLitElemTempData data = {};
  3420. data.value = value;
  3421. data.elem_index = k;
  3422. array_add(temp_data, data);
  3423. }
  3424. } else {
  3425. lbCompoundLitElemTempData data = {};
  3426. data.value = value;
  3427. data.elem_index = lo;
  3428. data.elem_length = hi-lo;
  3429. array_add(temp_data, data);
  3430. }
  3431. }
  3432. } else {
  3433. auto tav = fv->field->tav;
  3434. GB_ASSERT(tav.mode == Addressing_Constant);
  3435. i64 index = exact_value_to_i64(tav.value);
  3436. lbValue value = lb_emit_conv(p, lb_build_expr(p, fv->value), et);
  3437. GB_ASSERT(!is_type_tuple(value.type));
  3438. lbCompoundLitElemTempData data = {};
  3439. data.value = value;
  3440. data.expr = fv->value;
  3441. if (bt->kind == Type_Matrix) {
  3442. data.elem_index = matrix_row_major_index_to_offset(bt, index);
  3443. } else {
  3444. data.elem_index = index;
  3445. }
  3446. array_add(temp_data, data);
  3447. }
  3448. } else {
  3449. if (bt->kind != Type_DynamicArray && lb_is_elem_const(elem, et)) {
  3450. continue;
  3451. }
  3452. lbValue field_expr = lb_build_expr(p, elem);
  3453. GB_ASSERT(!is_type_tuple(field_expr.type));
  3454. lbValue ev = lb_emit_conv(p, field_expr, et);
  3455. lbCompoundLitElemTempData data = {};
  3456. data.value = ev;
  3457. if (bt->kind == Type_Matrix) {
  3458. data.elem_index = matrix_row_major_index_to_offset(bt, i);
  3459. } else {
  3460. data.elem_index = i;
  3461. }
  3462. array_add(temp_data, data);
  3463. }
  3464. }
  3465. }
  3466. gb_internal void lb_build_addr_compound_lit_assign_array(lbProcedure *p, Array<lbCompoundLitElemTempData> const &temp_data) {
  3467. for (auto const &td : temp_data) {
  3468. if (td.value.value != nullptr) {
  3469. if (td.elem_length > 0) {
  3470. auto loop_data = lb_loop_start(p, cast(isize)td.elem_length, t_i32);
  3471. {
  3472. lbValue dst = td.gep;
  3473. dst = lb_emit_ptr_offset(p, dst, loop_data.idx);
  3474. lb_emit_store(p, dst, td.value);
  3475. }
  3476. lb_loop_end(p, loop_data);
  3477. } else {
  3478. lb_emit_store(p, td.gep, td.value);
  3479. }
  3480. }
  3481. }
  3482. }
  3483. gb_internal lbAddr lb_build_addr_index_expr(lbProcedure *p, Ast *expr) {
  3484. ast_node(ie, IndexExpr, expr);
  3485. Type *t = base_type(type_of_expr(ie->expr));
  3486. bool deref = is_type_pointer(t);
  3487. t = base_type(type_deref(t));
  3488. if (is_type_soa_struct(t)) {
  3489. // SOA STRUCTURES!!!!
  3490. lbValue val = lb_build_addr_ptr(p, ie->expr);
  3491. if (deref) {
  3492. val = lb_emit_load(p, val);
  3493. }
  3494. lbValue index = lb_build_expr(p, ie->index);
  3495. return lb_addr_soa_variable(val, index, ie->index);
  3496. }
  3497. if (ie->expr->tav.mode == Addressing_SoaVariable) {
  3498. // SOA Structures for slices/dynamic arrays
  3499. GB_ASSERT_MSG(is_type_multi_pointer(type_of_expr(ie->expr)), "%s", type_to_string(type_of_expr(ie->expr)));
  3500. lbValue field = lb_build_expr(p, ie->expr);
  3501. lbValue index = lb_build_expr(p, ie->index);
  3502. if (!build_context.no_bounds_check) {
  3503. Ast *se_expr = unparen_expr(ie->expr);
  3504. if (se_expr->kind == Ast_SelectorExpr) {
  3505. ast_node(se, SelectorExpr, se_expr);
  3506. lbValue len = {};
  3507. Type *type = base_type(type_deref(type_of_expr(se->expr)));
  3508. GB_ASSERT_MSG(is_type_soa_struct(type), "%s", type_to_string(type));
  3509. if (type->Struct.soa_kind == StructSoa_Fixed) {
  3510. len = lb_const_int(p->module, t_int, type->Struct.soa_count);
  3511. } else {
  3512. lbAddr *found = map_get(&p->selector_addr, se_expr);
  3513. if (found) {
  3514. lbAddr addr = *found;
  3515. lbValue parent = lb_addr_get_ptr(p, addr);
  3516. if (is_type_pointer(type_deref(parent.type))) {
  3517. parent = lb_emit_load(p, parent);
  3518. }
  3519. len = lb_soa_struct_len(p, parent);
  3520. }
  3521. }
  3522. if (len.value) {
  3523. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3524. }
  3525. } else {
  3526. // TODO(bill): how do you even do bounds checking here?
  3527. }
  3528. }
  3529. lbValue val = lb_emit_ptr_offset(p, field, index);
  3530. return lb_addr(val);
  3531. }
  3532. GB_ASSERT_MSG(is_type_indexable(t), "%s %s", type_to_string(t), expr_to_string(expr));
  3533. if (is_type_map(t)) {
  3534. lbAddr map_addr = lb_build_addr(p, ie->expr);
  3535. lbValue key = lb_build_expr(p, ie->index);
  3536. key = lb_emit_conv(p, key, t->Map.key);
  3537. Type *result_type = type_of_expr(expr);
  3538. lbValue map_ptr = lb_addr_get_ptr(p, map_addr);
  3539. if (is_type_pointer(type_deref(map_ptr.type))) {
  3540. map_ptr = lb_emit_load(p, map_ptr);
  3541. }
  3542. return lb_addr_map(map_ptr, key, t, result_type);
  3543. }
  3544. switch (t->kind) {
  3545. case Type_Array: {
  3546. lbValue array = {};
  3547. array = lb_build_addr_ptr(p, ie->expr);
  3548. if (deref) {
  3549. array = lb_emit_load(p, array);
  3550. }
  3551. lbValue index = lb_build_expr(p, ie->index);
  3552. index = lb_emit_conv(p, index, t_int);
  3553. lbValue elem = lb_emit_array_ep(p, array, index);
  3554. auto index_tv = type_and_value_of_expr(ie->index);
  3555. if (index_tv.mode != Addressing_Constant) {
  3556. lbValue len = lb_const_int(p->module, t_int, t->Array.count);
  3557. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3558. }
  3559. return lb_addr(elem);
  3560. }
  3561. case Type_EnumeratedArray: {
  3562. lbValue array = {};
  3563. array = lb_build_addr_ptr(p, ie->expr);
  3564. if (deref) {
  3565. array = lb_emit_load(p, array);
  3566. }
  3567. Type *index_type = t->EnumeratedArray.index;
  3568. auto index_tv = type_and_value_of_expr(ie->index);
  3569. lbValue index = {};
  3570. if (compare_exact_values(Token_NotEq, *t->EnumeratedArray.min_value, exact_value_i64(0))) {
  3571. if (index_tv.mode == Addressing_Constant) {
  3572. ExactValue idx = exact_value_sub(index_tv.value, *t->EnumeratedArray.min_value);
  3573. index = lb_const_value(p->module, index_type, idx);
  3574. } else {
  3575. index = lb_emit_arith(p, Token_Sub,
  3576. lb_build_expr(p, ie->index),
  3577. lb_const_value(p->module, index_type, *t->EnumeratedArray.min_value),
  3578. index_type);
  3579. index = lb_emit_conv(p, index, t_int);
  3580. }
  3581. } else {
  3582. index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3583. }
  3584. lbValue elem = lb_emit_array_ep(p, array, index);
  3585. if (index_tv.mode != Addressing_Constant) {
  3586. lbValue len = lb_const_int(p->module, t_int, t->EnumeratedArray.count);
  3587. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3588. }
  3589. return lb_addr(elem);
  3590. }
  3591. case Type_Slice: {
  3592. lbValue slice = {};
  3593. slice = lb_build_expr(p, ie->expr);
  3594. if (deref) {
  3595. slice = lb_emit_load(p, slice);
  3596. }
  3597. lbValue elem = lb_slice_elem(p, slice);
  3598. lbValue index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3599. lbValue len = lb_slice_len(p, slice);
  3600. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3601. lbValue v = lb_emit_ptr_offset(p, elem, index);
  3602. return lb_addr(v);
  3603. }
  3604. case Type_MultiPointer: {
  3605. lbValue multi_ptr = {};
  3606. multi_ptr = lb_build_expr(p, ie->expr);
  3607. if (deref) {
  3608. multi_ptr = lb_emit_load(p, multi_ptr);
  3609. }
  3610. lbValue index = lb_build_expr(p, ie->index);
  3611. index = lb_emit_conv(p, index, t_int);
  3612. lbValue v = {};
  3613. LLVMValueRef indices[1] = {index.value};
  3614. v.value = LLVMBuildGEP2(p->builder, lb_type(p->module, t->MultiPointer.elem), multi_ptr.value, indices, 1, "");
  3615. v.type = alloc_type_pointer(t->MultiPointer.elem);
  3616. return lb_addr(v);
  3617. }
  3618. case Type_DynamicArray: {
  3619. lbValue dynamic_array = {};
  3620. dynamic_array = lb_build_expr(p, ie->expr);
  3621. if (deref) {
  3622. dynamic_array = lb_emit_load(p, dynamic_array);
  3623. }
  3624. lbValue elem = lb_dynamic_array_elem(p, dynamic_array);
  3625. lbValue len = lb_dynamic_array_len(p, dynamic_array);
  3626. lbValue index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3627. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3628. lbValue v = lb_emit_ptr_offset(p, elem, index);
  3629. return lb_addr(v);
  3630. }
  3631. case Type_Matrix: {
  3632. lbValue matrix = {};
  3633. matrix = lb_build_addr_ptr(p, ie->expr);
  3634. if (deref) {
  3635. matrix = lb_emit_load(p, matrix);
  3636. }
  3637. lbValue index = lb_build_expr(p, ie->index);
  3638. index = lb_emit_conv(p, index, t_int);
  3639. isize bounds_len = 0;
  3640. lbValue elem = {};
  3641. if (t->Matrix.is_row_major) {
  3642. bounds_len = t->Matrix.row_count;
  3643. elem = lb_emit_matrix_ep(p, matrix, index, lb_const_int(p->module, t_int, 0));
  3644. } else {
  3645. bounds_len = t->Matrix.column_count;
  3646. elem = lb_emit_matrix_ep(p, matrix, lb_const_int(p->module, t_int, 0), index);
  3647. }
  3648. elem = lb_emit_conv(p, elem, alloc_type_pointer(type_of_expr(expr)));
  3649. auto index_tv = type_and_value_of_expr(ie->index);
  3650. if (index_tv.mode != Addressing_Constant) {
  3651. lbValue len = lb_const_int(p->module, t_int, bounds_len);
  3652. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3653. }
  3654. return lb_addr(elem);
  3655. }
  3656. case Type_Basic: { // Basic_string
  3657. lbValue str;
  3658. lbValue elem;
  3659. lbValue len;
  3660. lbValue index;
  3661. str = lb_build_expr(p, ie->expr);
  3662. if (deref) {
  3663. str = lb_emit_load(p, str);
  3664. }
  3665. elem = lb_string_elem(p, str);
  3666. len = lb_string_len(p, str);
  3667. index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3668. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3669. return lb_addr(lb_emit_ptr_offset(p, elem, index));
  3670. }
  3671. }
  3672. return {};
  3673. }
  3674. gb_internal lbAddr lb_build_addr_slice_expr(lbProcedure *p, Ast *expr) {
  3675. ast_node(se, SliceExpr, expr);
  3676. lbAddr addr = lb_build_addr(p, se->expr);
  3677. lbValue base = lb_addr_load(p, addr);
  3678. Type *type = base_type(base.type);
  3679. if (is_type_pointer(type)) {
  3680. type = base_type(type_deref(type));
  3681. addr = lb_addr(base);
  3682. base = lb_addr_load(p, addr);
  3683. }
  3684. lbValue low = lb_const_int(p->module, t_int, 0);
  3685. lbValue high = {};
  3686. if (se->low != nullptr) {
  3687. low = lb_correct_endianness(p, lb_build_expr(p, se->low));
  3688. }
  3689. if (se->high != nullptr) {
  3690. high = lb_correct_endianness(p, lb_build_expr(p, se->high));
  3691. }
  3692. bool no_indices = se->low == nullptr && se->high == nullptr;
  3693. switch (type->kind) {
  3694. case Type_Slice: {
  3695. Type *slice_type = type;
  3696. lbValue len = lb_slice_len(p, base);
  3697. if (high.value == nullptr) high = len;
  3698. if (!no_indices) {
  3699. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3700. }
  3701. lbValue elem = lb_emit_ptr_offset(p, lb_slice_elem(p, base), low);
  3702. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3703. lbAddr slice = lb_add_local_generated(p, slice_type, false);
  3704. lb_fill_slice(p, slice, elem, new_len);
  3705. return slice;
  3706. }
  3707. case Type_DynamicArray: {
  3708. Type *elem_type = type->DynamicArray.elem;
  3709. Type *slice_type = alloc_type_slice(elem_type);
  3710. lbValue len = lb_dynamic_array_len(p, base);
  3711. if (high.value == nullptr) high = len;
  3712. if (!no_indices) {
  3713. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3714. }
  3715. lbValue elem = lb_emit_ptr_offset(p, lb_dynamic_array_elem(p, base), low);
  3716. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3717. lbAddr slice = lb_add_local_generated(p, slice_type, false);
  3718. lb_fill_slice(p, slice, elem, new_len);
  3719. return slice;
  3720. }
  3721. case Type_MultiPointer: {
  3722. lbAddr res = lb_add_local_generated(p, type_of_expr(expr), false);
  3723. if (se->high == nullptr) {
  3724. lbValue offset = base;
  3725. LLVMValueRef indices[1] = {low.value};
  3726. offset.value = LLVMBuildGEP2(p->builder, lb_type(p->module, base_type(offset.type)->MultiPointer.elem), offset.value, indices, 1, "");
  3727. lb_addr_store(p, res, offset);
  3728. } else {
  3729. low = lb_emit_conv(p, low, t_int);
  3730. high = lb_emit_conv(p, high, t_int);
  3731. lb_emit_multi_pointer_slice_bounds_check(p, se->open, low, high);
  3732. LLVMValueRef indices[1] = {low.value};
  3733. LLVMValueRef ptr = LLVMBuildGEP2(p->builder, lb_type(p->module, base_type(base.type)->MultiPointer.elem), base.value, indices, 1, "");
  3734. LLVMValueRef len = LLVMBuildSub(p->builder, high.value, low.value, "");
  3735. LLVMValueRef gep0 = lb_emit_struct_ep(p, res.addr, 0).value;
  3736. LLVMValueRef gep1 = lb_emit_struct_ep(p, res.addr, 1).value;
  3737. LLVMBuildStore(p->builder, ptr, gep0);
  3738. LLVMBuildStore(p->builder, len, gep1);
  3739. }
  3740. return res;
  3741. }
  3742. case Type_Array: {
  3743. Type *slice_type = alloc_type_slice(type->Array.elem);
  3744. lbValue len = lb_const_int(p->module, t_int, type->Array.count);
  3745. if (high.value == nullptr) high = len;
  3746. bool low_const = type_and_value_of_expr(se->low).mode == Addressing_Constant;
  3747. bool high_const = type_and_value_of_expr(se->high).mode == Addressing_Constant;
  3748. if (!low_const || !high_const) {
  3749. if (!no_indices) {
  3750. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3751. }
  3752. }
  3753. lbValue elem = lb_emit_ptr_offset(p, lb_array_elem(p, lb_addr_get_ptr(p, addr)), low);
  3754. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3755. lbAddr slice = lb_add_local_generated(p, slice_type, false);
  3756. lb_fill_slice(p, slice, elem, new_len);
  3757. return slice;
  3758. }
  3759. case Type_Basic: {
  3760. GB_ASSERT_MSG(are_types_identical(type, t_string), "got %s", type_to_string(type));
  3761. lbValue len = lb_string_len(p, base);
  3762. if (high.value == nullptr) high = len;
  3763. if (!no_indices) {
  3764. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3765. }
  3766. lbValue elem = lb_emit_ptr_offset(p, lb_string_elem(p, base), low);
  3767. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3768. lbAddr str = lb_add_local_generated(p, t_string, false);
  3769. lb_fill_string(p, str, elem, new_len);
  3770. return str;
  3771. }
  3772. case Type_Struct:
  3773. if (is_type_soa_struct(type)) {
  3774. lbValue len = lb_soa_struct_len(p, lb_addr_get_ptr(p, addr));
  3775. if (high.value == nullptr) high = len;
  3776. if (!no_indices) {
  3777. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3778. }
  3779. #if 1
  3780. lbAddr dst = lb_add_local_generated(p, type_of_expr(expr), true);
  3781. if (type->Struct.soa_kind == StructSoa_Fixed) {
  3782. i32 field_count = cast(i32)type->Struct.fields.count;
  3783. for (i32 i = 0; i < field_count; i++) {
  3784. lbValue field_dst = lb_emit_struct_ep(p, dst.addr, i);
  3785. lbValue field_src = lb_emit_struct_ep(p, lb_addr_get_ptr(p, addr), i);
  3786. field_src = lb_emit_array_ep(p, field_src, low);
  3787. field_src = lb_emit_conv(p, field_src, type_deref(field_dst.type));
  3788. lb_emit_store(p, field_dst, field_src);
  3789. }
  3790. lbValue len_dst = lb_emit_struct_ep(p, dst.addr, field_count);
  3791. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3792. lb_emit_store(p, len_dst, new_len);
  3793. } else if (type->Struct.soa_kind == StructSoa_Slice) {
  3794. if (no_indices) {
  3795. lb_addr_store(p, dst, base);
  3796. } else {
  3797. i32 field_count = cast(i32)type->Struct.fields.count - 1;
  3798. for (i32 i = 0; i < field_count; i++) {
  3799. lbValue field_dst = lb_emit_struct_ep(p, dst.addr, i);
  3800. lbValue field_src = lb_emit_struct_ev(p, base, i);
  3801. field_src = lb_emit_ptr_offset(p, field_src, low);
  3802. field_src = lb_emit_conv(p, field_src, type_deref(field_dst.type));
  3803. lb_emit_store(p, field_dst, field_src);
  3804. }
  3805. lbValue len_dst = lb_emit_struct_ep(p, dst.addr, field_count);
  3806. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3807. lb_emit_store(p, len_dst, new_len);
  3808. }
  3809. } else if (type->Struct.soa_kind == StructSoa_Dynamic) {
  3810. i32 field_count = cast(i32)type->Struct.fields.count - 3;
  3811. for (i32 i = 0; i < field_count; i++) {
  3812. lbValue field_dst = lb_emit_struct_ep(p, dst.addr, i);
  3813. lbValue field_src = lb_emit_struct_ev(p, base, i);
  3814. field_src = lb_emit_ptr_offset(p, field_src, low);
  3815. field_src = lb_emit_conv(p, field_src, type_deref(field_dst.type));
  3816. lb_emit_store(p, field_dst, field_src);
  3817. }
  3818. lbValue len_dst = lb_emit_struct_ep(p, dst.addr, field_count);
  3819. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3820. lb_emit_store(p, len_dst, new_len);
  3821. }
  3822. return dst;
  3823. #endif
  3824. }
  3825. break;
  3826. }
  3827. GB_PANIC("Unknown slicable type");
  3828. return {};
  3829. }
  3830. gb_internal lbAddr lb_build_addr_compound_lit(lbProcedure *p, Ast *expr) {
  3831. ast_node(cl, CompoundLit, expr);
  3832. Type *type = type_of_expr(expr);
  3833. Type *bt = base_type(type);
  3834. lbAddr v = lb_add_local_generated(p, type, true);
  3835. TEMPORARY_ALLOCATOR_GUARD();
  3836. Type *et = nullptr;
  3837. switch (bt->kind) {
  3838. case Type_Array: et = bt->Array.elem; break;
  3839. case Type_EnumeratedArray: et = bt->EnumeratedArray.elem; break;
  3840. case Type_Slice: et = bt->Slice.elem; break;
  3841. case Type_BitSet: et = bt->BitSet.elem; break;
  3842. case Type_SimdVector: et = bt->SimdVector.elem; break;
  3843. case Type_Matrix: et = bt->Matrix.elem; break;
  3844. }
  3845. String proc_name = {};
  3846. if (p->entity) {
  3847. proc_name = p->entity->token.string;
  3848. }
  3849. TokenPos pos = ast_token(expr).pos;
  3850. switch (bt->kind) {
  3851. default: GB_PANIC("Unknown CompoundLit type: %s", type_to_string(type)); break;
  3852. case Type_BitField: {
  3853. TEMPORARY_ALLOCATOR_GUARD();
  3854. // Type *backing_type = core_type(bt->BitField.backing_type);
  3855. struct FieldData {
  3856. Type *field_type;
  3857. u64 bit_offset;
  3858. u64 bit_size;
  3859. };
  3860. auto values = array_make<lbValue>(temporary_allocator(), 0, cl->elems.count);
  3861. auto fields = array_make<FieldData>(temporary_allocator(), 0, cl->elems.count);
  3862. for (Ast *elem : cl->elems) {
  3863. ast_node(fv, FieldValue, elem);
  3864. String name = fv->field->Ident.token.string;
  3865. Selection sel = lookup_field(bt, name, false);
  3866. GB_ASSERT(sel.is_bit_field);
  3867. GB_ASSERT(!sel.indirect);
  3868. GB_ASSERT(sel.index.count == 1);
  3869. GB_ASSERT(sel.entity != nullptr);
  3870. i64 index = sel.index[0];
  3871. Entity *f = bt->BitField.fields[index];
  3872. GB_ASSERT(f == sel.entity);
  3873. i64 bit_offset = bt->BitField.bit_offsets[index];
  3874. i64 bit_size = bt->BitField.bit_sizes[index];
  3875. GB_ASSERT(bit_size > 0);
  3876. Type *field_type = sel.entity->type;
  3877. lbValue field_expr = lb_build_expr(p, fv->value);
  3878. field_expr = lb_emit_conv(p, field_expr, field_type);
  3879. array_add(&values, field_expr);
  3880. array_add(&fields, FieldData{field_type, cast(u64)bit_offset, cast(u64)bit_size});
  3881. }
  3882. // NOTE(bill): inline insertion sort should be good enough, right?
  3883. for (isize i = 1; i < values.count; i++) {
  3884. for (isize j = i;
  3885. j > 0 && fields[i].bit_offset < fields[j].bit_offset;
  3886. j--) {
  3887. auto vtmp = values[j];
  3888. values[j] = values[j-1];
  3889. values[j-1] = vtmp;
  3890. auto ftmp = fields[j];
  3891. fields[j] = fields[j-1];
  3892. fields[j-1] = ftmp;
  3893. }
  3894. }
  3895. bool any_fields_different_endian = false;
  3896. for (auto const &f : fields) {
  3897. if (is_type_different_to_arch_endianness(f.field_type)) {
  3898. // NOTE(bill): Just be slow for this, to be correct
  3899. any_fields_different_endian = true;
  3900. break;
  3901. }
  3902. }
  3903. if (!any_fields_different_endian &&
  3904. fields.count == bt->BitField.fields.count) {
  3905. // SINGLE INTEGER BACKING ONLY
  3906. Type *backing_type = core_type(bt->BitField.backing_type);
  3907. GB_ASSERT(is_type_integer(backing_type) ||
  3908. (is_type_array(backing_type) && is_type_integer(backing_type->Array.elem)));
  3909. // NOTE(bill): all fields are present
  3910. // this means no masking is necessary since on write, the bits will be overridden
  3911. lbValue dst_byte_ptr = lb_emit_conv(p, v.addr, t_u8_ptr);
  3912. u64 total_bit_size = cast(u64)(8*type_size_of(bt));
  3913. if (is_type_integer(backing_type)) {
  3914. LLVMTypeRef lit = lb_type(p->module, backing_type);
  3915. LLVMValueRef res = LLVMConstInt(lit, 0, false);
  3916. for (isize i = 0; i < fields.count; i++) {
  3917. auto const &f = fields[i];
  3918. LLVMValueRef mask = LLVMConstInt(lit, 1, false);
  3919. #if LLVM_VERSION_MAJOR >= 19
  3920. mask = LLVMBuildShl(p->builder, mask, LLVMConstInt(lit, f.bit_size, false), "");
  3921. #else
  3922. mask = LLVMConstShl(mask, LLVMConstInt(lit, f.bit_size, false));
  3923. #endif
  3924. mask = LLVMConstSub(mask, LLVMConstInt(lit, 1, false));
  3925. LLVMValueRef elem = values[i].value;
  3926. if (lb_sizeof(lit) < lb_sizeof(LLVMTypeOf(elem))) {
  3927. elem = LLVMBuildTrunc(p->builder, elem, lit, "");
  3928. } else {
  3929. elem = LLVMBuildZExt(p->builder, elem, lit, "");
  3930. }
  3931. elem = LLVMBuildAnd(p->builder, elem, mask, "");
  3932. elem = LLVMBuildShl(p->builder, elem, LLVMConstInt(lit, f.bit_offset, false), "");
  3933. res = LLVMBuildOr(p->builder, res, elem, "");
  3934. }
  3935. LLVMBuildStore(p->builder, res, v.addr.value);
  3936. } else if (is_type_array(backing_type)) {
  3937. // ARRAY OF INTEGER BACKING
  3938. i64 array_count = backing_type->Array.count;
  3939. LLVMTypeRef lit = lb_type(p->module, core_type(backing_type->Array.elem));
  3940. gb_unused(array_count);
  3941. gb_unused(lit);
  3942. LLVMValueRef *elems = gb_alloc_array(temporary_allocator(), LLVMValueRef, array_count);
  3943. for (i64 i = 0; i < array_count; i++) {
  3944. elems[i] = LLVMConstInt(lit, 0, false);
  3945. }
  3946. u64 elem_bit_size = cast(u64)(8*type_size_of(backing_type->Array.elem));
  3947. u64 curr_bit_offset = 0;
  3948. for (isize i = 0; i < fields.count; i++) {
  3949. auto const &f = fields[i];
  3950. LLVMValueRef val = values[i].value;
  3951. LLVMTypeRef vt = lb_type(p->module, values[i].type);
  3952. for (u64 bits_to_set = f.bit_size;
  3953. bits_to_set > 0;
  3954. /**/) {
  3955. i64 elem_idx = curr_bit_offset/elem_bit_size;
  3956. u64 elem_bit_offset = curr_bit_offset%elem_bit_size;
  3957. u64 mask_width = gb_min(bits_to_set, elem_bit_size-elem_bit_offset);
  3958. GB_ASSERT(mask_width > 0);
  3959. bits_to_set -= mask_width;
  3960. LLVMValueRef mask = LLVMConstInt(vt, 1, false);
  3961. #if LLVM_VERSION_MAJOR >= 19
  3962. mask = LLVMBuildShl(p->builder, mask, LLVMConstInt(vt, mask_width, false), "");
  3963. #else
  3964. mask = LLVMConstShl(mask, LLVMConstInt(vt, mask_width, false));
  3965. #endif
  3966. mask = LLVMConstSub(mask, LLVMConstInt(vt, 1, false));
  3967. LLVMValueRef to_set = LLVMBuildAnd(p->builder, val, mask, "");
  3968. if (elem_bit_offset != 0) {
  3969. to_set = LLVMBuildShl(p->builder, to_set, LLVMConstInt(vt, elem_bit_offset, false), "");
  3970. }
  3971. to_set = LLVMBuildTrunc(p->builder, to_set, lit, "");
  3972. if (LLVMIsNull(elems[elem_idx])) {
  3973. elems[elem_idx] = to_set; // don't even bother doing `0 | to_set`
  3974. } else {
  3975. elems[elem_idx] = LLVMBuildOr(p->builder, elems[elem_idx], to_set, "");
  3976. }
  3977. if (mask_width != 0) {
  3978. val = LLVMBuildLShr(p->builder, val, LLVMConstInt(vt, mask_width, false), "");
  3979. }
  3980. curr_bit_offset += mask_width;
  3981. }
  3982. GB_ASSERT(curr_bit_offset == f.bit_offset + f.bit_size);
  3983. }
  3984. for (i64 i = 0; i < array_count; i++) {
  3985. LLVMValueRef elem_ptr = LLVMBuildStructGEP2(p->builder, lb_type(p->module, backing_type), v.addr.value, cast(unsigned)i, "");
  3986. LLVMBuildStore(p->builder, elems[i], elem_ptr);
  3987. }
  3988. } else {
  3989. // SLOW STORAGE
  3990. for_array(i, fields) {
  3991. auto const &f = fields[i];
  3992. if ((f.bit_offset & 7) == 0) {
  3993. u64 unpacked_bit_size = cast(u64)(8*type_size_of(f.field_type));
  3994. u64 byte_size = (f.bit_size+7)/8;
  3995. if (f.bit_offset + unpacked_bit_size <= total_bit_size) {
  3996. byte_size = unpacked_bit_size/8;
  3997. }
  3998. lbValue dst = lb_emit_ptr_offset(p, dst_byte_ptr, lb_const_int(p->module, t_int, f.bit_offset/8));
  3999. lbValue src = lb_address_from_load_or_generate_local(p, values[i]);
  4000. lb_mem_copy_non_overlapping(p, dst, src, lb_const_int(p->module, t_uintptr, byte_size));
  4001. } else {
  4002. lbAddr dst = lb_addr_bit_field(v.addr, f.field_type, f.bit_offset, f.bit_size);
  4003. lb_addr_store(p, dst, values[i]);
  4004. }
  4005. }
  4006. }
  4007. } else {
  4008. // individual storing
  4009. for_array(i, values) {
  4010. auto const &f = fields[i];
  4011. lbAddr dst = lb_addr_bit_field(v.addr, f.field_type, f.bit_offset, f.bit_size);
  4012. lb_addr_store(p, dst, values[i]);
  4013. }
  4014. }
  4015. return v;
  4016. }
  4017. case Type_Struct: {
  4018. // TODO(bill): "constant" '#raw_union's are not initialized constantly at the moment.
  4019. // NOTE(bill): This is due to the layout of the unions when printed to LLVM-IR
  4020. bool is_raw_union = is_type_raw_union(bt);
  4021. GB_ASSERT(is_type_struct(bt) || is_raw_union);
  4022. TypeStruct *st = &bt->Struct;
  4023. if (cl->elems.count > 0) {
  4024. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4025. lbValue comp_lit_ptr = lb_addr_get_ptr(p, v);
  4026. for_array(field_index, cl->elems) {
  4027. Ast *elem = cl->elems[field_index];
  4028. lbValue field_expr = {};
  4029. Entity *field = nullptr;
  4030. isize index = field_index;
  4031. if (elem->kind == Ast_FieldValue) {
  4032. ast_node(fv, FieldValue, elem);
  4033. String name = fv->field->Ident.token.string;
  4034. Selection sel = lookup_field(bt, name, false);
  4035. GB_ASSERT(!sel.indirect);
  4036. elem = fv->value;
  4037. if (sel.index.count > 1) {
  4038. if (lb_is_nested_possibly_constant(type, sel, elem)) {
  4039. continue;
  4040. }
  4041. field_expr = lb_build_expr(p, elem);
  4042. field_expr = lb_emit_conv(p, field_expr, sel.entity->type);
  4043. if (sel.is_bit_field) {
  4044. Selection sub_sel = trim_selection(sel);
  4045. lbValue trimmed_dst = lb_emit_deep_field_gep(p, comp_lit_ptr, sub_sel);
  4046. Type *bf = base_type(type_deref(trimmed_dst.type));
  4047. if (is_type_pointer(bf)) {
  4048. trimmed_dst = lb_emit_load(p, trimmed_dst);
  4049. bf = base_type(type_deref(trimmed_dst.type));
  4050. }
  4051. GB_ASSERT(bf->kind == Type_BitField);
  4052. isize idx = sel.index[sel.index.count-1];
  4053. lbAddr dst = lb_addr_bit_field(trimmed_dst, bf->BitField.fields[idx]->type, bf->BitField.bit_offsets[idx], bf->BitField.bit_sizes[idx]);
  4054. lb_addr_store(p, dst, field_expr);
  4055. } else {
  4056. lbValue dst = lb_emit_deep_field_gep(p, comp_lit_ptr, sel);
  4057. lb_emit_store(p, dst, field_expr);
  4058. }
  4059. continue;
  4060. }
  4061. index = sel.index[0];
  4062. } else {
  4063. Selection sel = lookup_field_from_index(bt, st->fields[field_index]->Variable.field_index);
  4064. GB_ASSERT(sel.index.count == 1);
  4065. GB_ASSERT(!sel.indirect);
  4066. index = sel.index[0];
  4067. }
  4068. field = st->fields[index];
  4069. Type *ft = field->type;
  4070. if (!is_raw_union && !is_type_typeid(ft) && lb_is_elem_const(elem, ft)) {
  4071. continue;
  4072. }
  4073. field_expr = lb_build_expr(p, elem);
  4074. lbValue gep = {};
  4075. if (is_raw_union) {
  4076. gep = lb_emit_conv(p, comp_lit_ptr, alloc_type_pointer(ft));
  4077. } else {
  4078. gep = lb_emit_struct_ep(p, comp_lit_ptr, cast(i32)index);
  4079. }
  4080. Type *fet = field_expr.type;
  4081. GB_ASSERT(fet->kind != Type_Tuple);
  4082. // HACK TODO(bill): THIS IS A MASSIVE HACK!!!!
  4083. if (is_type_union(ft) && !are_types_identical(fet, ft) && !is_type_untyped(fet)) {
  4084. GB_ASSERT_MSG(union_variant_index(ft, fet) >= 0, "%s", type_to_string(fet));
  4085. lb_emit_store_union_variant(p, gep, field_expr, fet);
  4086. } else {
  4087. lbValue fv = lb_emit_conv(p, field_expr, ft);
  4088. lb_emit_store(p, gep, fv);
  4089. }
  4090. }
  4091. }
  4092. break;
  4093. }
  4094. case Type_Map: {
  4095. if (cl->elems.count == 0) {
  4096. break;
  4097. }
  4098. GB_ASSERT(expr->file()->feature_flags & OptInFeatureFlag_DynamicLiterals);
  4099. lbValue err = lb_dynamic_map_reserve(p, v.addr, 2*cl->elems.count, pos);
  4100. gb_unused(err);
  4101. for (Ast *elem : cl->elems) {
  4102. ast_node(fv, FieldValue, elem);
  4103. lbValue key = lb_build_expr(p, fv->field);
  4104. lbValue value = lb_build_expr(p, fv->value);
  4105. lb_internal_dynamic_map_set(p, v.addr, type, key, value, elem);
  4106. }
  4107. break;
  4108. }
  4109. case Type_Array: {
  4110. if (cl->elems.count > 0) {
  4111. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4112. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4113. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4114. lbValue dst_ptr = lb_addr_get_ptr(p, v);
  4115. for_array(i, temp_data) {
  4116. i32 index = cast(i32)(temp_data[i].elem_index);
  4117. temp_data[i].gep = lb_emit_array_epi(p, dst_ptr, index);
  4118. }
  4119. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4120. }
  4121. break;
  4122. }
  4123. case Type_EnumeratedArray: {
  4124. if (cl->elems.count > 0) {
  4125. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4126. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4127. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4128. lbValue dst_ptr = lb_addr_get_ptr(p, v);
  4129. i64 index_offset = exact_value_to_i64(*bt->EnumeratedArray.min_value);
  4130. for_array(i, temp_data) {
  4131. i32 index = cast(i32)(temp_data[i].elem_index - index_offset);
  4132. temp_data[i].gep = lb_emit_array_epi(p, dst_ptr, index);
  4133. }
  4134. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4135. }
  4136. break;
  4137. }
  4138. case Type_Slice: {
  4139. if (cl->elems.count > 0) {
  4140. lbValue slice = lb_const_value(p->module, type, exact_value_compound(expr));
  4141. lbValue data = lb_slice_elem(p, slice);
  4142. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4143. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4144. for_array(i, temp_data) {
  4145. temp_data[i].gep = lb_emit_ptr_offset(p, data, lb_const_int(p->module, t_int, temp_data[i].elem_index));
  4146. }
  4147. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4148. {
  4149. lbValue count = {};
  4150. count.type = t_int;
  4151. unsigned len_index = lb_convert_struct_index(p->module, type, 1);
  4152. if (lb_is_const(slice)) {
  4153. unsigned indices[1] = {len_index};
  4154. count.value = llvm_const_extract_value(p->module, slice.value, indices, gb_count_of(indices));
  4155. } else {
  4156. count.value = LLVMBuildExtractValue(p->builder, slice.value, len_index, "");
  4157. }
  4158. lb_fill_slice(p, v, data, count);
  4159. }
  4160. }
  4161. break;
  4162. }
  4163. case Type_DynamicArray: {
  4164. if (cl->elems.count == 0) {
  4165. break;
  4166. }
  4167. GB_ASSERT(expr->file()->feature_flags & OptInFeatureFlag_DynamicLiterals);
  4168. Type *et = bt->DynamicArray.elem;
  4169. lbValue size = lb_const_int(p->module, t_int, type_size_of(et));
  4170. lbValue align = lb_const_int(p->module, t_int, type_align_of(et));
  4171. i64 item_count = gb_max(cl->max_count, cl->elems.count);
  4172. {
  4173. auto args = array_make<lbValue>(temporary_allocator(), 5);
  4174. args[0] = lb_emit_conv(p, lb_addr_get_ptr(p, v), t_rawptr);
  4175. args[1] = size;
  4176. args[2] = align;
  4177. args[3] = lb_const_int(p->module, t_int, item_count);
  4178. args[4] = lb_emit_source_code_location_as_global(p, proc_name, pos);
  4179. lb_emit_runtime_call(p, "__dynamic_array_reserve", args);
  4180. }
  4181. lbValue items = lb_generate_local_array(p, et, item_count);
  4182. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4183. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4184. for_array(i, temp_data) {
  4185. temp_data[i].gep = lb_emit_array_epi(p, items, temp_data[i].elem_index);
  4186. }
  4187. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4188. {
  4189. auto args = array_make<lbValue>(temporary_allocator(), 6);
  4190. args[0] = lb_emit_conv(p, v.addr, t_rawptr);
  4191. args[1] = size;
  4192. args[2] = align;
  4193. args[3] = lb_emit_conv(p, items, t_rawptr);
  4194. args[4] = lb_const_int(p->module, t_int, item_count);
  4195. args[5] = lb_emit_source_code_location_as_global(p, proc_name, pos);
  4196. lb_emit_runtime_call(p, "__dynamic_array_append", args);
  4197. }
  4198. break;
  4199. }
  4200. case Type_Basic: {
  4201. GB_ASSERT(is_type_any(bt));
  4202. if (cl->elems.count > 0) {
  4203. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4204. String field_names[2] = {
  4205. str_lit("data"),
  4206. str_lit("id"),
  4207. };
  4208. Type *field_types[2] = {
  4209. t_rawptr,
  4210. t_typeid,
  4211. };
  4212. for_array(field_index, cl->elems) {
  4213. Ast *elem = cl->elems[field_index];
  4214. lbValue field_expr = {};
  4215. isize index = field_index;
  4216. if (elem->kind == Ast_FieldValue) {
  4217. ast_node(fv, FieldValue, elem);
  4218. Selection sel = lookup_field(bt, fv->field->Ident.token.string, false);
  4219. index = sel.index[0];
  4220. elem = fv->value;
  4221. } else {
  4222. TypeAndValue tav = type_and_value_of_expr(elem);
  4223. Selection sel = lookup_field(bt, field_names[field_index], false);
  4224. index = sel.index[0];
  4225. }
  4226. field_expr = lb_build_expr(p, elem);
  4227. GB_ASSERT(field_expr.type->kind != Type_Tuple);
  4228. Type *ft = field_types[index];
  4229. lbValue fv = lb_emit_conv(p, field_expr, ft);
  4230. lbValue gep = lb_emit_struct_ep(p, lb_addr_get_ptr(p, v), cast(i32)index);
  4231. lb_emit_store(p, gep, fv);
  4232. }
  4233. }
  4234. break;
  4235. }
  4236. case Type_BitSet: {
  4237. i64 sz = type_size_of(type);
  4238. if (cl->elems.count > 0 && sz > 0) {
  4239. lbValue lower = lb_const_value(p->module, t_int, exact_value_i64(bt->BitSet.lower));
  4240. Type *backing = bit_set_to_int(type);
  4241. if (is_type_array(backing)) {
  4242. GB_PANIC("TODO: bit_set [N]T");
  4243. Type *base_it = core_array_type(backing);
  4244. i64 bits_per_elem = 8*type_size_of(base_it);
  4245. gb_unused(bits_per_elem);
  4246. lbValue one = lb_const_value(p->module, t_i64, exact_value_i64(1));
  4247. for (Ast *elem : cl->elems) {
  4248. GB_ASSERT(elem->kind != Ast_FieldValue);
  4249. lbValue expr = lb_build_expr(p, elem);
  4250. GB_ASSERT(expr.type->kind != Type_Tuple);
  4251. lbValue e = lb_emit_conv(p, expr, t_i64);
  4252. e = lb_emit_arith(p, Token_Sub, e, lower, t_i64);
  4253. // lbValue idx = lb_emit_arith(p, Token_Div, e, bits_per_elem, t_i64);
  4254. // lbValue val = lb_emit_arith(p, Token_Div, e, bits_per_elem, t_i64);
  4255. }
  4256. } else {
  4257. Type *it = bit_set_to_int(bt);
  4258. lbValue one = lb_const_value(p->module, it, exact_value_i64(1));
  4259. for (Ast *elem : cl->elems) {
  4260. GB_ASSERT(elem->kind != Ast_FieldValue);
  4261. lbValue expr = lb_build_expr(p, elem);
  4262. GB_ASSERT(expr.type->kind != Type_Tuple);
  4263. lbValue e = lb_emit_conv(p, expr, it);
  4264. e = lb_emit_arith(p, Token_Sub, e, lower, it);
  4265. e = lb_emit_arith(p, Token_Shl, one, e, it);
  4266. lbValue old_value = lb_emit_transmute(p, lb_addr_load(p, v), it);
  4267. lbValue new_value = lb_emit_arith(p, Token_Or, old_value, e, it);
  4268. new_value = lb_emit_transmute(p, new_value, type);
  4269. lb_addr_store(p, v, new_value);
  4270. }
  4271. }
  4272. }
  4273. break;
  4274. }
  4275. case Type_Matrix: {
  4276. if (cl->elems.count > 0) {
  4277. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4278. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4279. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4280. lbValue dst_ptr = lb_addr_get_ptr(p, v);
  4281. for_array(i, temp_data) {
  4282. temp_data[i].gep = lb_emit_array_epi(p, dst_ptr, temp_data[i].elem_index);
  4283. }
  4284. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4285. }
  4286. break;
  4287. }
  4288. case Type_SimdVector: {
  4289. if (cl->elems.count > 0) {
  4290. lbValue vector_value = lb_const_value(p->module, type, exact_value_compound(expr));
  4291. defer (lb_addr_store(p, v, vector_value));
  4292. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4293. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4294. // TODO(bill): reduce the need for individual `insertelement` if a `shufflevector`
  4295. // might be a better option
  4296. for (auto const &td : temp_data) {
  4297. if (td.value.value != nullptr) {
  4298. if (td.elem_length > 0) {
  4299. for (i64 k = 0; k < td.elem_length; k++) {
  4300. LLVMValueRef index = lb_const_int(p->module, t_u32, td.elem_index + k).value;
  4301. vector_value.value = LLVMBuildInsertElement(p->builder, vector_value.value, td.value.value, index, "");
  4302. }
  4303. } else {
  4304. LLVMValueRef index = lb_const_int(p->module, t_u32, td.elem_index).value;
  4305. vector_value.value = LLVMBuildInsertElement(p->builder, vector_value.value, td.value.value, index, "");
  4306. }
  4307. }
  4308. }
  4309. }
  4310. break;
  4311. }
  4312. }
  4313. return v;
  4314. }
  4315. gb_internal lbAddr lb_build_addr_internal(lbProcedure *p, Ast *expr) {
  4316. switch (expr->kind) {
  4317. case_ast_node(i, Implicit, expr);
  4318. lbAddr v = {};
  4319. switch (i->kind) {
  4320. case Token_context:
  4321. v = lb_find_or_generate_context_ptr(p);
  4322. break;
  4323. }
  4324. GB_ASSERT(v.addr.value != nullptr);
  4325. return v;
  4326. case_end;
  4327. case_ast_node(i, Ident, expr);
  4328. if (is_blank_ident(expr)) {
  4329. lbAddr val = {};
  4330. return val;
  4331. }
  4332. String name = i->token.string;
  4333. Entity *e = entity_of_node(expr);
  4334. return lb_build_addr_from_entity(p, e, expr);
  4335. case_end;
  4336. case_ast_node(se, SelectorExpr, expr);
  4337. Ast *sel_node = unparen_expr(se->selector);
  4338. if (sel_node->kind == Ast_Ident) {
  4339. String selector = sel_node->Ident.token.string;
  4340. TypeAndValue tav = type_and_value_of_expr(se->expr);
  4341. if (tav.mode == Addressing_Invalid) {
  4342. // NOTE(bill): Imports
  4343. Entity *imp = entity_of_node(se->expr);
  4344. if (imp != nullptr) {
  4345. GB_ASSERT(imp->kind == Entity_ImportName);
  4346. }
  4347. return lb_build_addr(p, unparen_expr(se->selector));
  4348. }
  4349. Type *type = base_type(tav.type);
  4350. if (tav.mode == Addressing_Type) { // Addressing_Type
  4351. Selection sel = lookup_field(tav.type, selector, true);
  4352. if (sel.pseudo_field) {
  4353. GB_ASSERT(sel.entity->kind == Entity_Procedure || sel.entity->kind == Entity_ProcGroup);
  4354. Entity *e = entity_of_node(sel_node);
  4355. GB_ASSERT(e->kind == Entity_Procedure);
  4356. return lb_addr(lb_find_value_from_entity(p->module, e));
  4357. }
  4358. GB_PANIC("Unreachable %.*s", LIT(selector));
  4359. }
  4360. if (se->swizzle_count > 0) {
  4361. Type *array_type = base_type(type_deref(tav.type));
  4362. GB_ASSERT(array_type->kind == Type_Array || array_type->kind == Type_SimdVector);
  4363. u8 swizzle_count = se->swizzle_count;
  4364. u8 swizzle_indices_raw = se->swizzle_indices;
  4365. u8 swizzle_indices[4] = {};
  4366. for (u8 i = 0; i < swizzle_count; i++) {
  4367. u8 index = swizzle_indices_raw>>(i*2) & 3;
  4368. swizzle_indices[i] = index;
  4369. }
  4370. lbValue a = {};
  4371. if (is_type_pointer(tav.type)) {
  4372. a = lb_build_expr(p, se->expr);
  4373. } else {
  4374. lbAddr addr = lb_build_addr(p, se->expr);
  4375. a = lb_addr_get_ptr(p, addr);
  4376. }
  4377. Type *type = type_deref(expr->tav.type);
  4378. GB_ASSERT(is_type_array(type) || is_type_simd_vector(type));
  4379. return lb_addr_swizzle(a, type, swizzle_count, swizzle_indices);
  4380. }
  4381. Selection sel = lookup_field(type, selector, false);
  4382. GB_ASSERT(sel.entity != nullptr);
  4383. if (sel.pseudo_field) {
  4384. GB_ASSERT(sel.entity->kind == Entity_Procedure || sel.entity->kind == Entity_ProcGroup);
  4385. Entity *e = entity_of_node(sel_node);
  4386. GB_ASSERT(e->kind == Entity_Procedure);
  4387. return lb_addr(lb_find_value_from_entity(p->module, e));
  4388. }
  4389. if (sel.is_bit_field) {
  4390. lbAddr addr = lb_build_addr(p, se->expr);
  4391. Selection sub_sel = sel;
  4392. sub_sel.index.count -= 1;
  4393. lbValue ptr = lb_addr_get_ptr(p, addr);
  4394. if (sub_sel.index.count > 0) {
  4395. ptr = lb_emit_deep_field_gep(p, ptr, sub_sel);
  4396. }
  4397. if (is_type_pointer(type_deref(ptr.type))) {
  4398. ptr = lb_emit_load(p, ptr);
  4399. }
  4400. Type *bf_type = type_deref(ptr.type);
  4401. bf_type = base_type(bf_type);
  4402. GB_ASSERT(bf_type->kind == Type_BitField);
  4403. i32 index = sel.index[sel.index.count-1];
  4404. Entity *f = bf_type->BitField.fields[index];
  4405. u8 bit_size = bf_type->BitField.bit_sizes[index];
  4406. i64 bit_offset = bf_type->BitField.bit_offsets[index];
  4407. return lb_addr_bit_field(ptr, f->type, bit_offset, bit_size);
  4408. }
  4409. {
  4410. lbAddr addr = lb_build_addr(p, se->expr);
  4411. if (addr.kind == lbAddr_Map) {
  4412. lbValue v = lb_addr_load(p, addr);
  4413. lbValue a = lb_address_from_load_or_generate_local(p, v);
  4414. a = lb_emit_deep_field_gep(p, a, sel);
  4415. return lb_addr(a);
  4416. } else if (addr.kind == lbAddr_Context) {
  4417. GB_ASSERT(sel.index.count > 0);
  4418. if (addr.ctx.sel.index.count >= 0) {
  4419. sel = selection_combine(addr.ctx.sel, sel);
  4420. }
  4421. addr.ctx.sel = sel;
  4422. addr.kind = lbAddr_Context;
  4423. return addr;
  4424. } else if (addr.kind == lbAddr_SoaVariable) {
  4425. lbValue index = addr.soa.index;
  4426. i32 first_index = sel.index[0];
  4427. Selection sub_sel = sel;
  4428. sub_sel.index.data += 1;
  4429. sub_sel.index.count -= 1;
  4430. lbValue arr = lb_emit_struct_ep(p, addr.addr, first_index);
  4431. Type *t = base_type(type_deref(addr.addr.type));
  4432. GB_ASSERT(is_type_soa_struct(t));
  4433. if (addr.soa.index_expr != nullptr && (!lb_is_const(addr.soa.index) || t->Struct.soa_kind != StructSoa_Fixed)) {
  4434. lbValue len = lb_soa_struct_len(p, addr.addr);
  4435. lb_emit_bounds_check(p, ast_token(addr.soa.index_expr), addr.soa.index, len);
  4436. }
  4437. lbValue item = {};
  4438. if (t->Struct.soa_kind == StructSoa_Fixed) {
  4439. item = lb_emit_array_ep(p, arr, index);
  4440. } else {
  4441. item = lb_emit_ptr_offset(p, lb_emit_load(p, arr), index);
  4442. }
  4443. if (sub_sel.index.count > 0) {
  4444. item = lb_emit_deep_field_gep(p, item, sub_sel);
  4445. }
  4446. // make sure it's ^T and not [^]T
  4447. item.type = alloc_type_multi_pointer_to_pointer(item.type);
  4448. return lb_addr(item);
  4449. } else if (addr.kind == lbAddr_Swizzle) {
  4450. GB_ASSERT(sel.index.count > 0);
  4451. // NOTE(bill): just patch the index in place
  4452. sel.index[0] = addr.swizzle.indices[sel.index[0]];
  4453. } else if (addr.kind == lbAddr_SwizzleLarge) {
  4454. GB_ASSERT(sel.index.count > 0);
  4455. // NOTE(bill): just patch the index in place
  4456. sel.index[0] = addr.swizzle.indices[sel.index[0]];
  4457. }
  4458. Type *atype = type_deref(lb_addr_type(addr));
  4459. if (is_type_soa_struct(atype)) {
  4460. map_set(&p->selector_addr, expr, addr);
  4461. }
  4462. lbValue a = lb_addr_get_ptr(p, addr);
  4463. a = lb_emit_deep_field_gep(p, a, sel);
  4464. return lb_addr(a);
  4465. }
  4466. } else {
  4467. GB_PANIC("Unsupported selector expression");
  4468. }
  4469. case_end;
  4470. case_ast_node(se, SelectorCallExpr, expr);
  4471. lbValue e = lb_build_expr(p, expr);
  4472. return lb_addr(lb_address_from_load_or_generate_local(p, e));
  4473. case_end;
  4474. case_ast_node(ta, TypeAssertion, expr);
  4475. TokenPos pos = ast_token(expr).pos;
  4476. lbValue e = lb_build_expr(p, ta->expr);
  4477. Type *t = type_deref(e.type);
  4478. if (is_type_union(t)) {
  4479. Type *type = type_of_expr(expr);
  4480. lbAddr v = lb_add_local_generated(p, type, false);
  4481. lb_addr_store(p, v, lb_emit_union_cast(p, lb_build_expr(p, ta->expr), type, pos));
  4482. return v;
  4483. } else if (is_type_any(t)) {
  4484. Type *type = type_of_expr(expr);
  4485. return lb_emit_any_cast_addr(p, lb_build_expr(p, ta->expr), type, pos);
  4486. } else {
  4487. GB_PANIC("TODO(bill): type assertion %s", type_to_string(e.type));
  4488. }
  4489. case_end;
  4490. case_ast_node(ue, UnaryExpr, expr);
  4491. switch (ue->op.kind) {
  4492. case Token_And: {
  4493. lbValue ptr = lb_build_expr(p, expr);
  4494. return lb_addr(lb_address_from_load_or_generate_local(p, ptr));
  4495. }
  4496. default:
  4497. GB_PANIC("Invalid unary expression for lb_build_addr");
  4498. }
  4499. case_end;
  4500. case_ast_node(be, BinaryExpr, expr);
  4501. lbValue v = lb_build_expr(p, expr);
  4502. Type *t = v.type;
  4503. if (is_type_pointer(t)) {
  4504. return lb_addr(v);
  4505. }
  4506. return lb_addr(lb_address_from_load_or_generate_local(p, v));
  4507. case_end;
  4508. case_ast_node(ie, IndexExpr, expr);
  4509. return lb_build_addr_index_expr(p, expr);
  4510. case_end;
  4511. case_ast_node(ie, MatrixIndexExpr, expr);
  4512. Type *t = base_type(type_of_expr(ie->expr));
  4513. bool deref = is_type_pointer(t);
  4514. t = base_type(type_deref(t));
  4515. lbValue m = {};
  4516. m = lb_build_addr_ptr(p, ie->expr);
  4517. if (deref) {
  4518. m = lb_emit_load(p, m);
  4519. }
  4520. lbValue row_index = lb_build_expr(p, ie->row_index);
  4521. lbValue column_index = lb_build_expr(p, ie->column_index);
  4522. row_index = lb_emit_conv(p, row_index, t_int);
  4523. column_index = lb_emit_conv(p, column_index, t_int);
  4524. lbValue elem = lb_emit_matrix_ep(p, m, row_index, column_index);
  4525. auto row_index_tv = type_and_value_of_expr(ie->row_index);
  4526. auto column_index_tv = type_and_value_of_expr(ie->column_index);
  4527. if (row_index_tv.mode != Addressing_Constant || column_index_tv.mode != Addressing_Constant) {
  4528. lbValue row_count = lb_const_int(p->module, t_int, t->Matrix.row_count);
  4529. lbValue column_count = lb_const_int(p->module, t_int, t->Matrix.column_count);
  4530. lb_emit_matrix_bounds_check(p, ast_token(ie->row_index), row_index, column_index, row_count, column_count);
  4531. }
  4532. return lb_addr(elem);
  4533. case_end;
  4534. case_ast_node(se, SliceExpr, expr);
  4535. return lb_build_addr_slice_expr(p, expr);
  4536. case_end;
  4537. case_ast_node(de, DerefExpr, expr);
  4538. Type *t = type_of_expr(de->expr);
  4539. if (is_type_soa_pointer(t)) {
  4540. lbValue value = lb_build_expr(p, de->expr);
  4541. lbValue ptr = lb_emit_struct_ev(p, value, 0);
  4542. lbValue idx = lb_emit_struct_ev(p, value, 1);
  4543. return lb_addr_soa_variable(ptr, idx, nullptr);
  4544. }
  4545. lbValue addr = lb_build_expr(p, de->expr);
  4546. return lb_addr(addr);
  4547. case_end;
  4548. case_ast_node(ce, CallExpr, expr);
  4549. BuiltinProcId builtin_id = BuiltinProc_Invalid;
  4550. if (ce->proc->tav.mode == Addressing_Builtin) {
  4551. Entity *e = entity_of_node(ce->proc);
  4552. if (e != nullptr) {
  4553. builtin_id = cast(BuiltinProcId)e->Builtin.id;
  4554. } else {
  4555. builtin_id = BuiltinProc_DIRECTIVE;
  4556. }
  4557. }
  4558. auto const &tv = expr->tav;
  4559. if (builtin_id == BuiltinProc_swizzle &&
  4560. is_type_array(tv.type)) {
  4561. // NOTE(bill, 2021-08-09): `swizzle` has some bizarre semantics so it needs to be
  4562. // specialized here for to be addressable
  4563. return lb_build_array_swizzle_addr(p, ce, tv);
  4564. }
  4565. // NOTE(bill): This is make sure you never need to have an 'array_ev'
  4566. lbValue e = lb_build_expr(p, expr);
  4567. #if 1
  4568. return lb_addr(lb_address_from_load_or_generate_local(p, e));
  4569. #else
  4570. lbAddr v = lb_add_local_generated(p, e.type, false);
  4571. lb_addr_store(p, v, e);
  4572. return v;
  4573. #endif
  4574. case_end;
  4575. case_ast_node(cl, CompoundLit, expr);
  4576. return lb_build_addr_compound_lit(p, expr);
  4577. case_end;
  4578. case_ast_node(tc, TypeCast, expr);
  4579. Type *type = type_of_expr(expr);
  4580. lbValue x = lb_build_expr(p, tc->expr);
  4581. lbValue e = {};
  4582. switch (tc->token.kind) {
  4583. case Token_cast:
  4584. e = lb_emit_conv(p, x, type);
  4585. break;
  4586. case Token_transmute:
  4587. e = lb_emit_transmute(p, x, type);
  4588. break;
  4589. default:
  4590. GB_PANIC("Invalid AST TypeCast");
  4591. }
  4592. lbAddr v = lb_add_local_generated(p, type, false);
  4593. lb_addr_store(p, v, e);
  4594. return v;
  4595. case_end;
  4596. case_ast_node(ac, AutoCast, expr);
  4597. return lb_build_addr(p, ac->expr);
  4598. case_end;
  4599. case_ast_node(te, TernaryIfExpr, expr);
  4600. LLVMValueRef incoming_values[2] = {};
  4601. LLVMBasicBlockRef incoming_blocks[2] = {};
  4602. GB_ASSERT(te->y != nullptr);
  4603. lbBlock *then = lb_create_block(p, "if.then");
  4604. lbBlock *done = lb_create_block(p, "if.done"); // NOTE(bill): Append later
  4605. lbBlock *else_ = lb_create_block(p, "if.else");
  4606. lb_build_cond(p, te->cond, then, else_);
  4607. lb_start_block(p, then);
  4608. Type *ptr_type = alloc_type_pointer(default_type(type_of_expr(expr)));
  4609. incoming_values[0] = lb_emit_conv(p, lb_build_addr_ptr(p, te->x), ptr_type).value;
  4610. lb_emit_jump(p, done);
  4611. lb_start_block(p, else_);
  4612. incoming_values[1] = lb_emit_conv(p, lb_build_addr_ptr(p, te->y), ptr_type).value;
  4613. lb_emit_jump(p, done);
  4614. lb_start_block(p, done);
  4615. lbValue res = {};
  4616. res.value = LLVMBuildPhi(p->builder, lb_type(p->module, ptr_type), "");
  4617. res.type = ptr_type;
  4618. GB_ASSERT(p->curr_block->preds.count >= 2);
  4619. incoming_blocks[0] = p->curr_block->preds[0]->block;
  4620. incoming_blocks[1] = p->curr_block->preds[1]->block;
  4621. LLVMAddIncoming(res.value, incoming_values, incoming_blocks, 2);
  4622. return lb_addr(res);
  4623. case_end;
  4624. case_ast_node(oe, OrElseExpr, expr);
  4625. lbValue ptr = lb_address_from_load_or_generate_local(p, lb_build_expr(p, expr));
  4626. return lb_addr(ptr);
  4627. case_end;
  4628. case_ast_node(oe, OrReturnExpr, expr);
  4629. lbValue ptr = lb_address_from_load_or_generate_local(p, lb_build_expr(p, expr));
  4630. return lb_addr(ptr);
  4631. case_end;
  4632. case_ast_node(be, OrBranchExpr, expr);
  4633. lbBlock *block = nullptr;
  4634. if (be->label != nullptr) {
  4635. lbBranchBlocks bb = lb_lookup_branch_blocks(p, be->label);
  4636. switch (be->token.kind) {
  4637. case Token_or_break: block = bb.break_; break;
  4638. case Token_or_continue: block = bb.continue_; break;
  4639. }
  4640. } else {
  4641. for (lbTargetList *t = p->target_list; t != nullptr && block == nullptr; t = t->prev) {
  4642. if (t->is_block) {
  4643. continue;
  4644. }
  4645. switch (be->token.kind) {
  4646. case Token_or_break: block = t->break_; break;
  4647. case Token_or_continue: block = t->continue_; break;
  4648. }
  4649. }
  4650. }
  4651. GB_ASSERT(block != nullptr);
  4652. TypeAndValue tv = expr->tav;
  4653. lbValue lhs = {};
  4654. lbValue rhs = {};
  4655. lb_emit_try_lhs_rhs(p, be->expr, tv, &lhs, &rhs);
  4656. Type *type = default_type(tv.type);
  4657. if (lhs.value) {
  4658. lhs = lb_emit_conv(p, lhs, type);
  4659. } else if (type != nullptr && type != t_invalid) {
  4660. lhs = lb_const_nil(p->module, type);
  4661. }
  4662. lbBlock *then = lb_create_block(p, "or_branch.then");
  4663. lbBlock *else_ = lb_create_block(p, "or_branch.else");
  4664. lb_emit_if(p, lb_emit_try_has_value(p, rhs), then, else_);
  4665. lb_start_block(p, else_);
  4666. lb_emit_defer_stmts(p, lbDeferExit_Branch, block, expr);
  4667. lb_emit_jump(p, block);
  4668. lb_start_block(p, then);
  4669. return lb_addr(lb_address_from_load_or_generate_local(p, lhs));
  4670. case_end;
  4671. }
  4672. TokenPos token_pos = ast_token(expr).pos;
  4673. GB_PANIC("Unexpected address expression\n"
  4674. "\tAst: %.*s @ "
  4675. "%s\n",
  4676. LIT(ast_strings[expr->kind]),
  4677. token_pos_to_string(token_pos));
  4678. return {};
  4679. }