llvm_backend_expr.cpp 172 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427
74278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477
74778477947804781478247834784478547864787478847894790479147924793479447954796479747984799480048014802480348044805480648074808480948104811481248134814481548164817481848194820482148224823482448254826482748284829483048314832483348344835483648374838483948404841484248434844484548464847484848494850485148524853485448554856485748584859486048614862486348644865486648674868486948704871487248734874487548764877487848794880488148824883488448854886488748884889489048914892489348944895489648974898489949004901490249034904490549064907490849094910491149124913491449154916491749184919492049214922492349244925492649274928492949304931493249334934493549364937493849394940494149424943494449454946494749484949495049514952495349544955495649574958495949604961496249634964496549664967496849694970497149724973497449754976497749784979498049814982498349844985498649874988498949904991499249934994499549964997499849995000500150025003500450055006500750085009501050115012501350145015501650175018501950205021502250235024502550265027502850295030503150325033503450355036503750385039504050415042504350445045504650475048504950505051505250535054505550565057505850595060506150625063506450655066506750685069507050715072507350745075507650775078507950805081508250835084508550865087508850895090509150925093509450955096509750985099510051015102510351045105510651075108510951105111511251135114511551165117511851195120512151225123512451255126512751285129513051315132513351345135513651375138513951405141514251435144514551465147514851495150515151525153515451555156515751585159516051615162516351645165516651675168516951705171517251735174517551765177517851795180518151825183518451855186518751885189519051915192519351945195519651975198519952005201520252035204520552065207520852095210521152125213521452155216521752185219522052215222522352245225522652275228522952305231523252335234523552365237523852395240524152425243524452455246524752485249525052515252525352545255525652575258525952605261526252635264526552665267526852695270527152725273527452755276527
75278527952805281528252835284528552865287528852895290529152925293529452955296529752985299530053015302530353045305530653075308530953105311531253135314531553165317531853195320532153225323532453255326532753285329533053315332533353345335533653375338533953405341534253435344534553465347534853495350535153525353535453555356535753585359536053615362536353645365536653675368536953705371537253735374537553765377537853795380538153825383538453855386538753885389539053915392539353945395539653975398539954005401540254035404540554065407540854095410541154125413541454155416541754185419542054215422542354245425542654275428542954305431543254335434543554365437543854395440544154425443544454455446544754485449545054515452545354545455545654575458545954605461546254635464546554665467546854695470547154725473547454755476547754785479548054815482548354845485548654875488548954905491549254935494549554965497549854995500550155025503550455055506550755085509551055115512
  // Forward declaration so that code earlier in this file can call it; in this
  // section lb_emit_unary_arith uses it to negate a matrix as `zero - x` with
  // component_wise set to true. The definition is not part of this section.
  1. gb_internal lbValue lb_emit_arith_matrix(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type, bool component_wise);
  2. gb_internal lbValue lb_emit_logical_binary_expr(lbProcedure *p, TokenKind op, Ast *left, Ast *right, Type *final_type) {
  3. lbModule *m = p->module;
  4. lbBlock *rhs = lb_create_block(p, "logical.cmp.rhs");
  5. lbBlock *done = lb_create_block(p, "logical.cmp.done");
  6. lbValue short_circuit = {};
  7. if (op == Token_CmpAnd) {
  8. lb_build_cond(p, left, rhs, done);
  9. short_circuit = lb_const_bool(m, t_llvm_bool, false);
  10. } else if (op == Token_CmpOr) {
  11. lb_build_cond(p, left, done, rhs);
  12. short_circuit = lb_const_bool(m, t_llvm_bool, true);
  13. }
  14. if (rhs->preds.count == 0) {
  15. lb_start_block(p, done);
  16. return short_circuit;
  17. }
  18. if (done->preds.count == 0) {
  19. lb_start_block(p, rhs);
  20. if (lb_is_expr_untyped_const(right)) {
  21. return lb_expr_untyped_const_to_typed(m, right, default_type(final_type));
  22. }
  23. return lb_build_expr(p, right);
  24. }
  25. Array<LLVMValueRef> incoming_values = {};
  26. Array<LLVMBasicBlockRef> incoming_blocks = {};
  27. array_init(&incoming_values, heap_allocator(), done->preds.count+1);
  28. array_init(&incoming_blocks, heap_allocator(), done->preds.count+1);
  29. for_array(i, done->preds) {
  30. incoming_values[i] = short_circuit.value;
  31. incoming_blocks[i] = done->preds[i]->block;
  32. }
  33. lb_start_block(p, rhs);
  34. lbValue edge = {};
  35. if (lb_is_expr_untyped_const(right)) {
  36. edge = lb_expr_untyped_const_to_typed(m, right, t_llvm_bool);
  37. } else {
  38. edge = lb_emit_conv(p, lb_build_expr(p, right), t_llvm_bool);
  39. }
  40. GB_ASSERT(edge.type == t_llvm_bool);
  41. incoming_values[done->preds.count] = edge.value;
  42. incoming_blocks[done->preds.count] = p->curr_block->block;
  43. lb_emit_jump(p, done);
  44. lb_start_block(p, done);
  45. LLVMTypeRef dst_type = lb_type(m, t_llvm_bool);
  46. LLVMValueRef phi = nullptr;
  47. GB_ASSERT(incoming_values.count == incoming_blocks.count);
  48. GB_ASSERT(incoming_values.count > 0);
  49. LLVMTypeRef phi_type = nullptr;
  50. for (LLVMValueRef incoming_value : incoming_values) {
  51. if (!LLVMIsConstant(incoming_value)) {
  52. phi_type = LLVMTypeOf(incoming_value);
  53. break;
  54. }
  55. }
  56. lbValue res = {};
  57. if (phi_type == nullptr) {
  58. phi = LLVMBuildPhi(p->builder, dst_type, "");
  59. LLVMAddIncoming(phi, incoming_values.data, incoming_blocks.data, cast(unsigned)incoming_values.count);
  60. res.value = phi;
  61. res.type = t_llvm_bool;
  62. } else {
  63. for_array(i, incoming_values) {
  64. LLVMValueRef incoming_value = incoming_values[i];
  65. LLVMTypeRef incoming_type = LLVMTypeOf(incoming_value);
  66. if (phi_type != incoming_type) {
  67. GB_ASSERT_MSG(LLVMIsConstant(incoming_value), "%s vs %s", LLVMPrintTypeToString(phi_type), LLVMPrintTypeToString(incoming_type));
  68. bool ok = !!LLVMConstIntGetZExtValue(incoming_value);
  69. incoming_values[i] = LLVMConstInt(phi_type, ok, false);
  70. }
  71. }
  72. // NOTE(bill): this now only uses i1 for the logic to prevent issues with corrupted booleans which are not of value 0 or 1 (e.g. 2)
  73. // Doing this may produce slightly worse code as a result but it will be correct behaviour
  74. phi = LLVMBuildPhi(p->builder, phi_type, "");
  75. LLVMAddIncoming(phi, incoming_values.data, incoming_blocks.data, cast(unsigned)incoming_values.count);
  76. res.value = phi;
  77. res.type = t_llvm_bool;
  78. }
  79. return lb_emit_conv(p, res, default_type(final_type));
  80. }
  81. gb_internal lbValue lb_emit_unary_arith(lbProcedure *p, TokenKind op, lbValue x, Type *type) {
  82. switch (op) {
  83. case Token_Add:
  84. return x;
  85. case Token_Not: // Boolean not
  86. case Token_Xor: // Bitwise not
  87. case Token_Sub: // Number negation
  88. break;
  89. case Token_Pointer:
  90. GB_PANIC("This should be handled elsewhere");
  91. break;
  92. }
  93. if (is_type_array_like(x.type)) {
  94. // IMPORTANT TODO(bill): This is very wasteful with regards to stack memory
  95. Type *tl = base_type(x.type);
  96. lbValue val = lb_address_from_load_or_generate_local(p, x);
  97. GB_ASSERT(is_type_array_like(type));
  98. Type *elem_type = base_array_type(type);
  99. // NOTE(bill): Doesn't need to be zero because it will be initialized in the loops
  100. lbAddr res_addr = lb_add_local(p, type, nullptr, false, true);
  101. lbValue res = lb_addr_get_ptr(p, res_addr);
  102. bool inline_array_arith = lb_can_try_to_inline_array_arith(type);
  103. i32 count = cast(i32)get_array_type_count(tl);
  104. LLVMTypeRef vector_type = nullptr;
  105. if (op != Token_Not && lb_try_vector_cast(p->module, val, &vector_type)) {
  106. LLVMValueRef vp = LLVMBuildPointerCast(p->builder, val.value, LLVMPointerType(vector_type, 0), "");
  107. LLVMValueRef v = OdinLLVMBuildLoad(p, vector_type, vp);
  108. LLVMValueRef opv = nullptr;
  109. switch (op) {
  110. case Token_Xor:
  111. opv = LLVMBuildNot(p->builder, v, "");
  112. if (is_type_bit_set(elem_type)) {
  113. ExactValue ev_mask = exact_bit_set_all_set_mask(elem_type);
  114. lbValue mask = lb_const_value(p->module, elem_type, ev_mask);
  115. opv = LLVMBuildAnd(p->builder, opv, mask.value, "");
  116. }
  117. break;
  118. case Token_Sub:
  119. if (is_type_float(elem_type)) {
  120. opv = LLVMBuildFNeg(p->builder, v, "");
  121. } else {
  122. opv = LLVMBuildNeg(p->builder, v, "");
  123. }
  124. break;
  125. }
  126. if (opv != nullptr) {
  127. LLVMSetAlignment(res.value, cast(unsigned)lb_alignof(vector_type));
  128. LLVMValueRef res_ptr = LLVMBuildPointerCast(p->builder, res.value, LLVMPointerType(vector_type, 0), "");
  129. LLVMBuildStore(p->builder, opv, res_ptr);
  130. return lb_emit_conv(p, lb_emit_load(p, res), type);
  131. }
  132. }
  133. if (inline_array_arith) {
  134. // inline
  135. for (i32 i = 0; i < count; i++) {
  136. lbValue e = lb_emit_load(p, lb_emit_array_epi(p, val, i));
  137. lbValue z = lb_emit_unary_arith(p, op, e, elem_type);
  138. lb_emit_store(p, lb_emit_array_epi(p, res, i), z);
  139. }
  140. } else {
  141. auto loop_data = lb_loop_start(p, count, t_i32);
  142. lbValue e = lb_emit_load(p, lb_emit_array_ep(p, val, loop_data.idx));
  143. lbValue z = lb_emit_unary_arith(p, op, e, elem_type);
  144. lb_emit_store(p, lb_emit_array_ep(p, res, loop_data.idx), z);
  145. lb_loop_end(p, loop_data);
  146. }
  147. return lb_emit_load(p, res);
  148. }
  149. if (op == Token_Xor) {
  150. lbValue cmp = {};
  151. cmp.type = x.type;
  152. if (is_type_bit_set(x.type)) {
  153. ExactValue ev_mask = exact_bit_set_all_set_mask(x.type);
  154. lbValue mask = lb_const_value(p->module, x.type, ev_mask);
  155. cmp.value = LLVMBuildXor(p->builder, x.value, mask.value, "");
  156. } else {
  157. cmp.value = LLVMBuildNot(p->builder, x.value, "");
  158. }
  159. return lb_emit_conv(p, cmp, type);
  160. }
  161. if (op == Token_Not) {
  162. lbValue cmp = {};
  163. LLVMValueRef zero = LLVMConstInt(lb_type(p->module, x.type), 0, false);
  164. cmp.value = LLVMBuildICmp(p->builder, LLVMIntEQ, x.value, zero, "");
  165. cmp.type = t_llvm_bool;
  166. return lb_emit_conv(p, cmp, type);
  167. }
  168. if (op == Token_Sub && is_type_integer(type) && is_type_different_to_arch_endianness(type)) {
  169. Type *platform_type = integer_endian_type_to_platform_type(type);
  170. lbValue v = lb_emit_byte_swap(p, x, platform_type);
  171. lbValue res = {};
  172. res.value = LLVMBuildNeg(p->builder, v.value, "");
  173. res.type = platform_type;
  174. return lb_emit_byte_swap(p, res, type);
  175. }
  176. if (op == Token_Sub && is_type_float(type) && is_type_different_to_arch_endianness(type)) {
  177. Type *platform_type = integer_endian_type_to_platform_type(type);
  178. lbValue v = lb_emit_byte_swap(p, x, platform_type);
  179. lbValue res = {};
  180. res.value = LLVMBuildFNeg(p->builder, v.value, "");
  181. res.type = platform_type;
  182. return lb_emit_byte_swap(p, res, type);
  183. }
  184. lbValue res = {};
  185. switch (op) {
  186. case Token_Not: // Boolean not
  187. case Token_Xor: // Bitwise not
  188. res.value = LLVMBuildNot(p->builder, x.value, "");
  189. res.type = x.type;
  190. return res;
  191. case Token_Sub: // Number negation
  192. if (is_type_integer(x.type)) {
  193. res.value = LLVMBuildNeg(p->builder, x.value, "");
  194. } else if (is_type_float(x.type)) {
  195. res.value = LLVMBuildFNeg(p->builder, x.value, "");
  196. } else if (is_type_complex(x.type)) {
  197. LLVMValueRef v0 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 0, ""), "");
  198. LLVMValueRef v1 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 1, ""), "");
  199. lbAddr addr = lb_add_local_generated(p, x.type, false);
  200. LLVMTypeRef type = llvm_addr_type(p->module, addr.addr);
  201. LLVMBuildStore(p->builder, v0, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 0, ""));
  202. LLVMBuildStore(p->builder, v1, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 1, ""));
  203. return lb_addr_load(p, addr);
  204. } else if (is_type_quaternion(x.type)) {
  205. LLVMValueRef v0 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 0, ""), "");
  206. LLVMValueRef v1 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 1, ""), "");
  207. LLVMValueRef v2 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 2, ""), "");
  208. LLVMValueRef v3 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 3, ""), "");
  209. lbAddr addr = lb_add_local_generated(p, x.type, false);
  210. LLVMTypeRef type = llvm_addr_type(p->module, addr.addr);
  211. LLVMBuildStore(p->builder, v0, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 0, ""));
  212. LLVMBuildStore(p->builder, v1, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 1, ""));
  213. LLVMBuildStore(p->builder, v2, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 2, ""));
  214. LLVMBuildStore(p->builder, v3, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 3, ""));
  215. return lb_addr_load(p, addr);
  216. } else if (is_type_simd_vector(x.type)) {
  217. Type *elem = base_array_type(x.type);
  218. if (is_type_float(elem)) {
  219. res.value = LLVMBuildFNeg(p->builder, x.value, "");
  220. } else {
  221. res.value = LLVMBuildNeg(p->builder, x.value, "");
  222. }
  223. } else if (is_type_matrix(x.type)) {
  224. lbValue zero = {};
  225. zero.value = LLVMConstNull(lb_type(p->module, type));
  226. zero.type = type;
  227. return lb_emit_arith_matrix(p, Token_Sub, zero, x, type, true);
  228. } else {
  229. GB_PANIC("Unhandled type %s", type_to_string(x.type));
  230. }
  231. res.type = x.type;
  232. return res;
  233. }
  234. return res;
  235. }
  236. gb_internal bool lb_try_direct_vector_arith(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type, lbValue *res_) {
  237. GB_ASSERT(is_type_array_like(type));
  238. Type *elem_type = base_array_type(type);
  239. // NOTE(bill): Shift operations cannot be easily dealt with due to Odin's semantics
  240. if (op == Token_Shl || op == Token_Shr) {
  241. return false;
  242. }
  243. if (!LLVMIsALoadInst(lhs.value) || !LLVMIsALoadInst(rhs.value)) {
  244. return false;
  245. }
  246. lbValue lhs_ptr = {};
  247. lbValue rhs_ptr = {};
  248. lhs_ptr.value = LLVMGetOperand(lhs.value, 0);
  249. lhs_ptr.type = alloc_type_pointer(lhs.type);
  250. rhs_ptr.value = LLVMGetOperand(rhs.value, 0);
  251. rhs_ptr.type = alloc_type_pointer(rhs.type);
  252. LLVMTypeRef vector_type0 = nullptr;
  253. LLVMTypeRef vector_type1 = nullptr;
  254. if (lb_try_vector_cast(p->module, lhs_ptr, &vector_type0) &&
  255. lb_try_vector_cast(p->module, rhs_ptr, &vector_type1)) {
  256. GB_ASSERT(vector_type0 == vector_type1);
  257. LLVMTypeRef vector_type = vector_type0;
  258. Type *integral_type = base_type(elem_type);
  259. if (is_type_simd_vector(integral_type)) {
  260. integral_type = core_array_type(integral_type);
  261. }
  262. if (is_type_bit_set(integral_type)) {
  263. switch (op) {
  264. case Token_Add: op = Token_Or; break;
  265. case Token_Sub: op = Token_AndNot; break;
  266. }
  267. Type *u = bit_set_to_int(type);
  268. if (is_type_array(u)) {
  269. return false;
  270. }
  271. }
  272. LLVMValueRef lhs_vp = LLVMBuildPointerCast(p->builder, lhs_ptr.value, LLVMPointerType(vector_type, 0), "");
  273. LLVMValueRef rhs_vp = LLVMBuildPointerCast(p->builder, rhs_ptr.value, LLVMPointerType(vector_type, 0), "");
  274. LLVMValueRef x = OdinLLVMBuildLoad(p, vector_type, lhs_vp);
  275. LLVMValueRef y = OdinLLVMBuildLoad(p, vector_type, rhs_vp);
  276. LLVMValueRef z = nullptr;
  277. if (is_type_float(integral_type)) {
  278. switch (op) {
  279. case Token_Add:
  280. z = LLVMBuildFAdd(p->builder, x, y, "");
  281. break;
  282. case Token_Sub:
  283. z = LLVMBuildFSub(p->builder, x, y, "");
  284. break;
  285. case Token_Mul:
  286. z = LLVMBuildFMul(p->builder, x, y, "");
  287. break;
  288. case Token_Quo:
  289. z = LLVMBuildFDiv(p->builder, x, y, "");
  290. break;
  291. case Token_Mod:
  292. z = LLVMBuildFRem(p->builder, x, y, "");
  293. break;
  294. default:
  295. GB_PANIC("Unsupported vector operation %.*s", LIT(token_strings[op]));
  296. break;
  297. }
  298. } else {
  299. switch (op) {
  300. case Token_Add:
  301. z = LLVMBuildAdd(p->builder, x, y, "");
  302. break;
  303. case Token_Sub:
  304. z = LLVMBuildSub(p->builder, x, y, "");
  305. break;
  306. case Token_Mul:
  307. z = LLVMBuildMul(p->builder, x, y, "");
  308. break;
  309. case Token_Quo:
  310. if (is_type_unsigned(integral_type)) {
  311. z = LLVMBuildUDiv(p->builder, x, y, "");
  312. } else {
  313. z = LLVMBuildSDiv(p->builder, x, y, "");
  314. }
  315. break;
  316. case Token_Mod:
  317. if (is_type_unsigned(integral_type)) {
  318. z = LLVMBuildURem(p->builder, x, y, "");
  319. } else {
  320. z = LLVMBuildSRem(p->builder, x, y, "");
  321. }
  322. break;
  323. case Token_ModMod:
  324. if (is_type_unsigned(integral_type)) {
  325. z = LLVMBuildURem(p->builder, x, y, "");
  326. } else {
  327. LLVMValueRef a = LLVMBuildSRem(p->builder, x, y, "");
  328. LLVMValueRef b = LLVMBuildAdd(p->builder, a, y, "");
  329. z = LLVMBuildSRem(p->builder, b, y, "");
  330. }
  331. break;
  332. case Token_And:
  333. z = LLVMBuildAnd(p->builder, x, y, "");
  334. break;
  335. case Token_AndNot:
  336. z = LLVMBuildAnd(p->builder, x, LLVMBuildNot(p->builder, y, ""), "");
  337. break;
  338. case Token_Or:
  339. z = LLVMBuildOr(p->builder, x, y, "");
  340. break;
  341. case Token_Xor:
  342. z = LLVMBuildXor(p->builder, x, y, "");
  343. break;
  344. default:
  345. GB_PANIC("Unsupported vector operation");
  346. break;
  347. }
  348. }
  349. if (z != nullptr) {
  350. lbAddr res = lb_add_local_generated_temp(p, type, lb_alignof(vector_type));
  351. LLVMValueRef vp = LLVMBuildPointerCast(p->builder, res.addr.value, LLVMPointerType(vector_type, 0), "");
  352. LLVMBuildStore(p->builder, z, vp);
  353. lbValue v = lb_addr_load(p, res);
  354. if (res_) *res_ = v;
  355. return true;
  356. }
  357. }
  358. return false;
  359. }
  360. gb_internal lbValue lb_emit_arith_array(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type) {
  361. GB_ASSERT(is_type_array_like(lhs.type) || is_type_array_like(rhs.type));
  362. lhs = lb_emit_conv(p, lhs, type);
  363. rhs = lb_emit_conv(p, rhs, type);
  364. GB_ASSERT(is_type_array_like(type));
  365. Type *elem_type = base_array_type(type);
  366. i64 count = get_array_type_count(type);
  367. unsigned n = cast(unsigned)count;
  368. // NOTE(bill, 2021-06-12): Try to do a direct operation as a vector, if possible
  369. lbValue direct_vector_res = {};
  370. if (lb_try_direct_vector_arith(p, op, lhs, rhs, type, &direct_vector_res)) {
  371. return direct_vector_res;
  372. }
  373. bool inline_array_arith = lb_can_try_to_inline_array_arith(type);
  374. if (inline_array_arith) {
  375. auto dst_ptrs = slice_make<lbValue>(temporary_allocator(), n);
  376. auto a_loads = slice_make<lbValue>(temporary_allocator(), n);
  377. auto b_loads = slice_make<lbValue>(temporary_allocator(), n);
  378. auto c_ops = slice_make<lbValue>(temporary_allocator(), n);
  379. for (unsigned i = 0; i < n; i++) {
  380. a_loads[i].value = LLVMBuildExtractValue(p->builder, lhs.value, i, "");
  381. a_loads[i].type = elem_type;
  382. }
  383. for (unsigned i = 0; i < n; i++) {
  384. b_loads[i].value = LLVMBuildExtractValue(p->builder, rhs.value, i, "");
  385. b_loads[i].type = elem_type;
  386. }
  387. for (unsigned i = 0; i < n; i++) {
  388. c_ops[i] = lb_emit_arith(p, op, a_loads[i], b_loads[i], elem_type);
  389. }
  390. lbAddr res = lb_add_local_generated(p, type, false);
  391. for (unsigned i = 0; i < n; i++) {
  392. dst_ptrs[i] = lb_emit_array_epi(p, res.addr, i);
  393. }
  394. for (unsigned i = 0; i < n; i++) {
  395. lb_emit_store(p, dst_ptrs[i], c_ops[i]);
  396. }
  397. return lb_addr_load(p, res);
  398. } else {
  399. lbValue x = lb_address_from_load_or_generate_local(p, lhs);
  400. lbValue y = lb_address_from_load_or_generate_local(p, rhs);
  401. lbAddr res = lb_add_local_generated(p, type, false);
  402. auto loop_data = lb_loop_start(p, cast(isize)count, t_i32);
  403. lbValue a_ptr = lb_emit_array_ep(p, x, loop_data.idx);
  404. lbValue b_ptr = lb_emit_array_ep(p, y, loop_data.idx);
  405. lbValue dst_ptr = lb_emit_array_ep(p, res.addr, loop_data.idx);
  406. lbValue a = lb_emit_load(p, a_ptr);
  407. lbValue b = lb_emit_load(p, b_ptr);
  408. lbValue c = lb_emit_arith(p, op, a, b, elem_type);
  409. lb_emit_store(p, dst_ptr, c);
  410. lb_loop_end(p, loop_data);
  411. return lb_addr_load(p, res);
  412. }
  413. }
  414. gb_internal bool lb_is_matrix_simdable(Type *t) {
  415. Type *mt = base_type(t);
  416. GB_ASSERT(mt->kind == Type_Matrix);
  417. Type *elem = core_type(mt->Matrix.elem);
  418. if (is_type_complex(elem)) {
  419. return false;
  420. }
  421. if (is_type_different_to_arch_endianness(elem)) {
  422. return false;
  423. }
  424. switch (build_context.metrics.arch) {
  425. default:
  426. return false;
  427. case TargetArch_amd64:
  428. case TargetArch_arm64:
  429. break;
  430. }
  431. if (type_align_of(t) < 16) {
  432. // it's not aligned well enough to use the vector instructions
  433. return false;
  434. }
  435. if ((mt->Matrix.row_count & 1) ^ (mt->Matrix.column_count & 1)) {
  436. return false;
  437. }
  438. if (mt->Matrix.is_row_major) {
  439. // TODO(bill): make #row_major matrices work with SIMD
  440. return false;
  441. }
  442. if (elem->kind == Type_Basic) {
  443. switch (elem->Basic.kind) {
  444. case Basic_f16:
  445. case Basic_f16le:
  446. case Basic_f16be:
  447. switch (build_context.metrics.arch) {
  448. case TargetArch_amd64:
  449. return false;
  450. case TargetArch_arm64:
  451. // TODO(bill): determine when this is fine
  452. return true;
  453. case TargetArch_i386:
  454. case TargetArch_wasm32:
  455. case TargetArch_wasm64p32:
  456. return false;
  457. }
  458. }
  459. }
  460. return true;
  461. }
  462. gb_internal LLVMValueRef lb_matrix_to_vector(lbProcedure *p, lbValue matrix) {
  463. Type *mt = base_type(matrix.type);
  464. GB_ASSERT(mt->kind == Type_Matrix);
  465. LLVMTypeRef elem_type = lb_type(p->module, mt->Matrix.elem);
  466. unsigned total_count = cast(unsigned)matrix_type_total_internal_elems(mt);
  467. LLVMTypeRef total_matrix_type = LLVMVectorType(elem_type, total_count);
  468. #if 1
  469. LLVMValueRef ptr = lb_address_from_load_or_generate_local(p, matrix).value;
  470. LLVMValueRef matrix_vector_ptr = LLVMBuildPointerCast(p->builder, ptr, LLVMPointerType(total_matrix_type, 0), "");
  471. LLVMValueRef matrix_vector = OdinLLVMBuildLoadAligned(p, total_matrix_type, matrix_vector_ptr, type_align_of(mt));
  472. return matrix_vector;
  473. #else
  474. LLVMValueRef matrix_vector = LLVMBuildBitCast(p->builder, matrix.value, total_matrix_type, "");
  475. return matrix_vector;
  476. #endif
  477. }
  478. gb_internal LLVMValueRef lb_matrix_trimmed_vector_mask(lbProcedure *p, Type *mt) {
  479. mt = base_type(mt);
  480. GB_ASSERT(mt->kind == Type_Matrix);
  481. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  482. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  483. unsigned column_count = cast(unsigned)mt->Matrix.column_count;
  484. unsigned mask_elems_index = 0;
  485. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), row_count*column_count);
  486. for (unsigned j = 0; j < column_count; j++) {
  487. for (unsigned i = 0; i < row_count; i++) {
  488. unsigned offset = stride*j + i;
  489. mask_elems[mask_elems_index++] = lb_const_int(p->module, t_u32, offset).value;
  490. }
  491. }
  492. LLVMValueRef mask = LLVMConstVector(mask_elems.data, cast(unsigned)mask_elems.count);
  493. return mask;
  494. }
  495. gb_internal LLVMValueRef lb_matrix_to_trimmed_vector(lbProcedure *p, lbValue m) {
  496. LLVMValueRef vector = lb_matrix_to_vector(p, m);
  497. Type *mt = base_type(m.type);
  498. GB_ASSERT(mt->kind == Type_Matrix);
  499. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  500. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  501. if (stride == row_count) {
  502. return vector;
  503. }
  504. LLVMValueRef mask = lb_matrix_trimmed_vector_mask(p, mt);
  505. LLVMValueRef trimmed_vector = llvm_basic_shuffle(p, vector, mask);
  506. return trimmed_vector;
  507. }
  508. gb_internal lbValue lb_emit_matrix_tranpose(lbProcedure *p, lbValue m, Type *type) {
  509. if (is_type_array(m.type)) {
  510. i32 rank = type_math_rank(m.type);
  511. if (rank == 2) {
  512. lbAddr addr = lb_add_local_generated(p, type, false);
  513. lbValue dst = addr.addr;
  514. lbValue src = m;
  515. i32 n = cast(i32)get_array_type_count(m.type);
  516. i32 m = cast(i32)get_array_type_count(type);
  517. // m.type == [n][m]T
  518. // type == [m][n]T
  519. for (i32 j = 0; j < m; j++) {
  520. lbValue dst_col = lb_emit_struct_ep(p, dst, j);
  521. for (i32 i = 0; i < n; i++) {
  522. lbValue dst_row = lb_emit_struct_ep(p, dst_col, i);
  523. lbValue src_col = lb_emit_struct_ev(p, src, i);
  524. lbValue src_row = lb_emit_struct_ev(p, src_col, j);
  525. lb_emit_store(p, dst_row, src_row);
  526. }
  527. }
  528. return lb_addr_load(p, addr);
  529. }
  530. // no-op
  531. m.type = type;
  532. return m;
  533. }
  534. Type *mt = base_type(m.type);
  535. GB_ASSERT(mt->kind == Type_Matrix);
  536. if (lb_is_matrix_simdable(mt)) {
  537. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  538. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  539. unsigned column_count = cast(unsigned)mt->Matrix.column_count;
  540. auto rows = slice_make<LLVMValueRef>(permanent_allocator(), row_count);
  541. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  542. LLVMValueRef vector = lb_matrix_to_vector(p, m);
  543. for (unsigned i = 0; i < row_count; i++) {
  544. for (unsigned j = 0; j < column_count; j++) {
  545. unsigned offset = stride*j + i;
  546. mask_elems[j] = lb_const_int(p->module, t_u32, offset).value;
  547. }
  548. // transpose mask
  549. LLVMValueRef mask = LLVMConstVector(mask_elems.data, column_count);
  550. LLVMValueRef row = llvm_basic_shuffle(p, vector, mask);
  551. rows[i] = row;
  552. }
  553. lbAddr res = lb_add_local_generated(p, type, true);
  554. for_array(i, rows) {
  555. LLVMValueRef row = rows[i];
  556. lbValue dst_row_ptr = lb_emit_matrix_epi(p, res.addr, 0, i);
  557. LLVMValueRef ptr = dst_row_ptr.value;
  558. ptr = LLVMBuildPointerCast(p->builder, ptr, LLVMPointerType(LLVMTypeOf(row), 0), "");
  559. LLVMBuildStore(p->builder, row, ptr);
  560. }
  561. return lb_addr_load(p, res);
  562. }
  563. lbAddr res = lb_add_local_generated(p, type, true);
  564. i64 row_count = mt->Matrix.row_count;
  565. i64 column_count = mt->Matrix.column_count;
  566. for (i64 j = 0; j < column_count; j++) {
  567. for (i64 i = 0; i < row_count; i++) {
  568. lbValue src = lb_emit_matrix_ev(p, m, i, j);
  569. lbValue dst = lb_emit_matrix_epi(p, res.addr, j, i);
  570. lb_emit_store(p, dst, src);
  571. }
  572. }
  573. return lb_addr_load(p, res);
  574. }
  575. gb_internal lbValue lb_matrix_cast_vector_to_type(lbProcedure *p, LLVMValueRef vector, Type *type) {
  576. lbAddr res = lb_add_local_generated(p, type, true);
  577. LLVMValueRef res_ptr = res.addr.value;
  578. unsigned alignment = cast(unsigned)gb_max(type_align_of(type), lb_alignof(LLVMTypeOf(vector)));
  579. LLVMSetAlignment(res_ptr, alignment);
  580. res_ptr = LLVMBuildPointerCast(p->builder, res_ptr, LLVMPointerType(LLVMTypeOf(vector), 0), "");
  581. LLVMBuildStore(p->builder, vector, res_ptr);
  582. return lb_addr_load(p, res);
  583. }
  584. gb_internal lbValue lb_emit_matrix_flatten(lbProcedure *p, lbValue m, Type *type) {
  585. if (is_type_array(m.type)) {
  586. // no-op
  587. m.type = type;
  588. return m;
  589. }
  590. Type *mt = base_type(m.type);
  591. GB_ASSERT(mt->kind == Type_Matrix);
  592. lbAddr res = lb_add_local_generated(p, type, true);
  593. GB_ASSERT(type_size_of(type) == type_size_of(m.type));
  594. lbValue m_ptr = lb_address_from_load_or_generate_local(p, m);
  595. lbValue n = lb_const_int(p->module, t_int, type_size_of(type));
  596. lb_mem_copy_non_overlapping(p, res.addr, m_ptr, n);
  597. // i64 row_count = mt->Matrix.row_count;
  598. // i64 column_count = mt->Matrix.column_count;
  599. // TEMPORARY_ALLOCATOR_GUARD();
  600. // auto srcs = array_make<lbValue>(temporary_allocator(), 0, row_count*column_count);
  601. // auto dsts = array_make<lbValue>(temporary_allocator(), 0, row_count*column_count);
  602. // for (i64 j = 0; j < column_count; j++) {
  603. // for (i64 i = 0; i < row_count; i++) {
  604. // lbValue src = lb_emit_matrix_ev(p, m, i, j);
  605. // array_add(&srcs, src);
  606. // }
  607. // }
  608. // for (i64 j = 0; j < column_count; j++) {
  609. // for (i64 i = 0; i < row_count; i++) {
  610. // lbValue dst = lb_emit_array_epi(p, res.addr, i + j*row_count);
  611. // array_add(&dsts, dst);
  612. // }
  613. // }
  614. // GB_ASSERT(srcs.count == dsts.count);
  615. // for_array(i, srcs) {
  616. // lb_emit_store(p, dsts[i], srcs[i]);
  617. // }
  618. return lb_addr_load(p, res);
  619. }
  620. gb_internal lbValue lb_emit_outer_product(lbProcedure *p, lbValue a, lbValue b, Type *type) {
  621. Type *mt = base_type(type);
  622. Type *at = base_type(a.type);
  623. Type *bt = base_type(b.type);
  624. GB_ASSERT(mt->kind == Type_Matrix);
  625. GB_ASSERT(at->kind == Type_Array);
  626. GB_ASSERT(bt->kind == Type_Array);
  627. i64 row_count = mt->Matrix.row_count;
  628. i64 column_count = mt->Matrix.column_count;
  629. GB_ASSERT(row_count == at->Array.count);
  630. GB_ASSERT(column_count == bt->Array.count);
  631. lbAddr res = lb_add_local_generated(p, type, true);
  632. for (i64 j = 0; j < column_count; j++) {
  633. for (i64 i = 0; i < row_count; i++) {
  634. lbValue x = lb_emit_struct_ev(p, a, cast(i32)i);
  635. lbValue y = lb_emit_struct_ev(p, b, cast(i32)j);
  636. lbValue src = lb_emit_arith(p, Token_Mul, x, y, mt->Matrix.elem);
  637. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  638. lb_emit_store(p, dst, src);
  639. }
  640. }
  641. return lb_addr_load(p, res);
  642. }
  643. gb_internal lbValue lb_emit_matrix_mul(lbProcedure *p, lbValue lhs, lbValue rhs, Type *type) {
  644. // TODO(bill): Handle edge case for f16 types on x86(-64) platforms
  645. Type *xt = base_type(lhs.type);
  646. Type *yt = base_type(rhs.type);
  647. GB_ASSERT(is_type_matrix(type));
  648. GB_ASSERT(is_type_matrix(xt));
  649. GB_ASSERT(is_type_matrix(yt));
  650. GB_ASSERT(xt->Matrix.column_count == yt->Matrix.row_count);
  651. GB_ASSERT(are_types_identical(xt->Matrix.elem, yt->Matrix.elem));
  652. GB_ASSERT(xt->Matrix.is_row_major == yt->Matrix.is_row_major);
  653. Type *elem = xt->Matrix.elem;
  654. unsigned outer_rows = cast(unsigned)xt->Matrix.row_count;
  655. unsigned inner = cast(unsigned)xt->Matrix.column_count;
  656. unsigned outer_columns = cast(unsigned)yt->Matrix.column_count;
  657. if (!xt->Matrix.is_row_major && lb_is_matrix_simdable(xt)) {
  658. unsigned x_stride = cast(unsigned)matrix_type_stride_in_elems(xt);
  659. unsigned y_stride = cast(unsigned)matrix_type_stride_in_elems(yt);
  660. auto x_rows = slice_make<LLVMValueRef>(permanent_allocator(), outer_rows);
  661. auto y_columns = slice_make<LLVMValueRef>(permanent_allocator(), outer_columns);
  662. LLVMValueRef x_vector = lb_matrix_to_vector(p, lhs);
  663. LLVMValueRef y_vector = lb_matrix_to_vector(p, rhs);
  664. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), inner);
  665. for (unsigned i = 0; i < outer_rows; i++) {
  666. for (unsigned j = 0; j < inner; j++) {
  667. unsigned offset = x_stride*j + i;
  668. mask_elems[j] = lb_const_int(p->module, t_u32, offset).value;
  669. }
  670. // transpose mask
  671. LLVMValueRef mask = LLVMConstVector(mask_elems.data, inner);
  672. LLVMValueRef row = llvm_basic_shuffle(p, x_vector, mask);
  673. x_rows[i] = row;
  674. }
  675. for (unsigned i = 0; i < outer_columns; i++) {
  676. LLVMValueRef mask = llvm_mask_iota(p->module, y_stride*i, inner);
  677. LLVMValueRef column = llvm_basic_shuffle(p, y_vector, mask);
  678. y_columns[i] = column;
  679. }
  680. lbAddr res = lb_add_local_generated(p, type, true);
  681. for_array(i, x_rows) {
  682. LLVMValueRef x_row = x_rows[i];
  683. for_array(j, y_columns) {
  684. LLVMValueRef y_column = y_columns[j];
  685. LLVMValueRef elem = llvm_vector_dot(p, x_row, y_column);
  686. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  687. LLVMBuildStore(p->builder, elem, dst.value);
  688. }
  689. }
  690. return lb_addr_load(p, res);
  691. }
  692. if (!xt->Matrix.is_row_major) {
  693. lbAddr res = lb_add_local_generated(p, type, true);
  694. auto inners = slice_make<lbValue[2]>(permanent_allocator(), inner);
  695. for (unsigned j = 0; j < outer_columns; j++) {
  696. for (unsigned i = 0; i < outer_rows; i++) {
  697. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  698. for (unsigned k = 0; k < inner; k++) {
  699. inners[k][0] = lb_emit_matrix_ev(p, lhs, i, k);
  700. inners[k][1] = lb_emit_matrix_ev(p, rhs, k, j);
  701. }
  702. lbValue sum = lb_const_nil(p->module, elem);
  703. for (unsigned k = 0; k < inner; k++) {
  704. lbValue a = inners[k][0];
  705. lbValue b = inners[k][1];
  706. sum = lb_emit_mul_add(p, a, b, sum, elem);
  707. }
  708. lb_emit_store(p, dst, sum);
  709. }
  710. }
  711. return lb_addr_load(p, res);
  712. } else {
  713. lbAddr res = lb_add_local_generated(p, type, true);
  714. auto inners = slice_make<lbValue[2]>(permanent_allocator(), inner);
  715. for (unsigned i = 0; i < outer_rows; i++) {
  716. for (unsigned j = 0; j < outer_columns; j++) {
  717. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  718. for (unsigned k = 0; k < inner; k++) {
  719. inners[k][0] = lb_emit_matrix_ev(p, lhs, i, k);
  720. inners[k][1] = lb_emit_matrix_ev(p, rhs, k, j);
  721. }
  722. lbValue sum = lb_const_nil(p->module, elem);
  723. for (unsigned k = 0; k < inner; k++) {
  724. lbValue a = inners[k][0];
  725. lbValue b = inners[k][1];
  726. sum = lb_emit_mul_add(p, a, b, sum, elem);
  727. }
  728. lb_emit_store(p, dst, sum);
  729. }
  730. }
  731. return lb_addr_load(p, res);
  732. }
  733. }
  734. gb_internal lbValue lb_emit_matrix_mul_vector(lbProcedure *p, lbValue lhs, lbValue rhs, Type *type) {
  735. // TODO(bill): Handle edge case for f16 types on x86(-64) platforms
  736. Type *mt = base_type(lhs.type);
  737. Type *vt = base_type(rhs.type);
  738. GB_ASSERT(is_type_matrix(mt));
  739. GB_ASSERT(is_type_array_like(vt));
  740. i64 vector_count = get_array_type_count(vt);
  741. GB_ASSERT(mt->Matrix.column_count == vector_count);
  742. GB_ASSERT(are_types_identical(mt->Matrix.elem, base_array_type(vt)));
  743. Type *elem = mt->Matrix.elem;
  744. if (!mt->Matrix.is_row_major && lb_is_matrix_simdable(mt)) {
  745. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  746. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  747. unsigned column_count = cast(unsigned)mt->Matrix.column_count;
  748. auto m_columns = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  749. auto v_rows = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  750. LLVMValueRef matrix_vector = lb_matrix_to_vector(p, lhs);
  751. for (unsigned column_index = 0; column_index < column_count; column_index++) {
  752. LLVMValueRef mask = llvm_mask_iota(p->module, stride*column_index, row_count);
  753. LLVMValueRef column = llvm_basic_shuffle(p, matrix_vector, mask);
  754. m_columns[column_index] = column;
  755. }
  756. for (unsigned row_index = 0; row_index < column_count; row_index++) {
  757. LLVMValueRef value = lb_emit_struct_ev(p, rhs, row_index).value;
  758. LLVMValueRef row = llvm_vector_broadcast(p, value, row_count);
  759. v_rows[row_index] = row;
  760. }
  761. GB_ASSERT(column_count > 0);
  762. LLVMValueRef vector = nullptr;
  763. for (i64 i = 0; i < column_count; i++) {
  764. if (i == 0) {
  765. vector = llvm_vector_mul(p, m_columns[i], v_rows[i]);
  766. } else {
  767. vector = llvm_vector_mul_add(p, m_columns[i], v_rows[i], vector);
  768. }
  769. }
  770. return lb_matrix_cast_vector_to_type(p, vector, type);
  771. }
  772. lbAddr res = lb_add_local_generated(p, type, true);
  773. for (i64 i = 0; i < mt->Matrix.row_count; i++) {
  774. for (i64 j = 0; j < mt->Matrix.column_count; j++) {
  775. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, 0);
  776. lbValue d0 = lb_emit_load(p, dst);
  777. lbValue a = lb_emit_matrix_ev(p, lhs, i, j);
  778. lbValue b = lb_emit_struct_ev(p, rhs, cast(i32)j);
  779. lbValue c = lb_emit_mul_add(p, a, b, d0, elem);
  780. lb_emit_store(p, dst, c);
  781. }
  782. }
  783. return lb_addr_load(p, res);
  784. }
  785. gb_internal lbValue lb_emit_vector_mul_matrix(lbProcedure *p, lbValue lhs, lbValue rhs, Type *type) {
  786. // TODO(bill): Handle edge case for f16 types on x86(-64) platforms
  787. Type *mt = base_type(rhs.type);
  788. Type *vt = base_type(lhs.type);
  789. GB_ASSERT(is_type_matrix(mt));
  790. GB_ASSERT(is_type_array_like(vt));
  791. i64 vector_count = get_array_type_count(vt);
  792. GB_ASSERT(vector_count == mt->Matrix.row_count);
  793. GB_ASSERT(are_types_identical(mt->Matrix.elem, base_array_type(vt)));
  794. Type *elem = mt->Matrix.elem;
  795. if (!mt->Matrix.is_row_major && lb_is_matrix_simdable(mt)) {
  796. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  797. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  798. unsigned column_count = cast(unsigned)mt->Matrix.column_count; gb_unused(column_count);
  799. auto m_columns = slice_make<LLVMValueRef>(permanent_allocator(), row_count);
  800. auto v_rows = slice_make<LLVMValueRef>(permanent_allocator(), row_count);
  801. LLVMValueRef matrix_vector = lb_matrix_to_vector(p, rhs);
  802. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  803. for (unsigned row_index = 0; row_index < row_count; row_index++) {
  804. for (unsigned column_index = 0; column_index < column_count; column_index++) {
  805. unsigned offset = row_index + column_index*stride;
  806. mask_elems[column_index] = lb_const_int(p->module, t_u32, offset).value;
  807. }
  808. // transpose mask
  809. LLVMValueRef mask = LLVMConstVector(mask_elems.data, column_count);
  810. LLVMValueRef column = llvm_basic_shuffle(p, matrix_vector, mask);
  811. m_columns[row_index] = column;
  812. }
  813. for (unsigned column_index = 0; column_index < row_count; column_index++) {
  814. LLVMValueRef value = lb_emit_struct_ev(p, lhs, column_index).value;
  815. LLVMValueRef row = llvm_vector_broadcast(p, value, column_count);
  816. v_rows[column_index] = row;
  817. }
  818. GB_ASSERT(row_count > 0);
  819. LLVMValueRef vector = nullptr;
  820. for (i64 i = 0; i < row_count; i++) {
  821. if (i == 0) {
  822. vector = llvm_vector_mul(p, v_rows[i], m_columns[i]);
  823. } else {
  824. vector = llvm_vector_mul_add(p, v_rows[i], m_columns[i], vector);
  825. }
  826. }
  827. lbAddr res = lb_add_local_generated(p, type, true);
  828. LLVMValueRef res_ptr = res.addr.value;
  829. unsigned alignment = cast(unsigned)gb_max(type_align_of(type), lb_alignof(LLVMTypeOf(vector)));
  830. LLVMSetAlignment(res_ptr, alignment);
  831. res_ptr = LLVMBuildPointerCast(p->builder, res_ptr, LLVMPointerType(LLVMTypeOf(vector), 0), "");
  832. LLVMBuildStore(p->builder, vector, res_ptr);
  833. return lb_addr_load(p, res);
  834. }
  835. lbAddr res = lb_add_local_generated(p, type, true);
  836. for (i64 j = 0; j < mt->Matrix.column_count; j++) {
  837. for (i64 k = 0; k < mt->Matrix.row_count; k++) {
  838. lbValue dst = lb_emit_matrix_epi(p, res.addr, 0, j);
  839. lbValue d0 = lb_emit_load(p, dst);
  840. lbValue a = lb_emit_struct_ev(p, lhs, cast(i32)k);
  841. lbValue b = lb_emit_matrix_ev(p, rhs, k, j);
  842. lbValue c = lb_emit_mul_add(p, a, b, d0, elem);
  843. lb_emit_store(p, dst, c);
  844. }
  845. }
  846. return lb_addr_load(p, res);
  847. }
  848. gb_internal lbValue lb_emit_arith_matrix(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type, bool component_wise) {
  849. GB_ASSERT(is_type_matrix(lhs.type) || is_type_matrix(rhs.type));
  850. if (op == Token_Mul && !component_wise) {
  851. Type *xt = base_type(lhs.type);
  852. Type *yt = base_type(rhs.type);
  853. if (xt->kind == Type_Matrix) {
  854. if (yt->kind == Type_Matrix) {
  855. return lb_emit_matrix_mul(p, lhs, rhs, type);
  856. } else if (is_type_array_like(yt)) {
  857. return lb_emit_matrix_mul_vector(p, lhs, rhs, type);
  858. }
  859. } else if (is_type_array_like(xt)) {
  860. GB_ASSERT(yt->kind == Type_Matrix);
  861. return lb_emit_vector_mul_matrix(p, lhs, rhs, type);
  862. } else {
  863. GB_ASSERT(xt->kind == Type_Basic);
  864. GB_ASSERT(yt->kind == Type_Matrix);
  865. GB_ASSERT(is_type_matrix(type));
  866. Type *array_type = alloc_type_array(yt->Matrix.elem, matrix_type_total_internal_elems(yt));
  867. GB_ASSERT(type_size_of(array_type) == type_size_of(yt));
  868. lbValue array_lhs = lb_emit_conv(p, lhs, array_type);
  869. lbValue array_rhs = rhs;
  870. array_rhs.type = array_type;
  871. lbValue array = lb_emit_arith(p, op, array_lhs, array_rhs, array_type);
  872. array.type = type;
  873. return array;
  874. }
  875. } else {
  876. if (is_type_matrix(lhs.type)) {
  877. rhs = lb_emit_conv(p, rhs, lhs.type);
  878. } else {
  879. lhs = lb_emit_conv(p, lhs, rhs.type);
  880. }
  881. Type *xt = base_type(lhs.type);
  882. Type *yt = base_type(rhs.type);
  883. GB_ASSERT_MSG(are_types_identical(xt, yt), "%s %.*s %s", type_to_string(lhs.type), LIT(token_strings[op]), type_to_string(rhs.type));
  884. GB_ASSERT(xt->kind == Type_Matrix);
  885. // element-wise arithmetic
  886. // pretend it is an array
  887. lbValue array_lhs = lhs;
  888. lbValue array_rhs = rhs;
  889. Type *array_type = alloc_type_array(xt->Matrix.elem, matrix_type_total_internal_elems(xt));
  890. GB_ASSERT(type_size_of(array_type) == type_size_of(xt));
  891. array_lhs.type = array_type;
  892. array_rhs.type = array_type;
  893. if (token_is_comparison(op)) {
  894. lbValue res = lb_emit_comp(p, op, array_lhs, array_rhs);
  895. return lb_emit_conv(p, res, type);
  896. } else {
  897. lbValue array = lb_emit_arith(p, op, array_lhs, array_rhs, array_type);
  898. array.type = type;
  899. return array;
  900. }
  901. }
  902. GB_PANIC("TODO: lb_emit_arith_matrix");
  903. return {};
  904. }
  905. gb_internal lbValue lb_emit_arith(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type) {
  906. if (is_type_array_like(lhs.type) || is_type_array_like(rhs.type)) {
  907. return lb_emit_arith_array(p, op, lhs, rhs, type);
  908. } else if (is_type_matrix(lhs.type) || is_type_matrix(rhs.type)) {
  909. return lb_emit_arith_matrix(p, op, lhs, rhs, type, false);
  910. } else if (is_type_complex(type)) {
  911. lhs = lb_emit_conv(p, lhs, type);
  912. rhs = lb_emit_conv(p, rhs, type);
  913. Type *ft = base_complex_elem_type(type);
  914. if (op == Token_Quo) {
  915. TEMPORARY_ALLOCATOR_GUARD();
  916. auto args = array_make<lbValue>(temporary_allocator(), 2);
  917. args[0] = lhs;
  918. args[1] = rhs;
  919. switch (type_size_of(ft)) {
  920. case 2: return lb_emit_runtime_call(p, "quo_complex32", args);
  921. case 4: return lb_emit_runtime_call(p, "quo_complex64", args);
  922. case 8: return lb_emit_runtime_call(p, "quo_complex128", args);
  923. default: GB_PANIC("Unknown float type"); break;
  924. }
  925. }
  926. lbAddr res = lb_add_local_generated(p, type, false); // NOTE: initialized in full later
  927. lbValue a = lb_emit_struct_ev(p, lhs, 0);
  928. lbValue b = lb_emit_struct_ev(p, lhs, 1);
  929. lbValue c = lb_emit_struct_ev(p, rhs, 0);
  930. lbValue d = lb_emit_struct_ev(p, rhs, 1);
  931. lbValue real = {};
  932. lbValue imag = {};
  933. switch (op) {
  934. case Token_Add:
  935. case Token_Sub:
  936. if (type_size_of(ft) == 2) {
  937. a = lb_emit_conv(p, a, t_f32);
  938. b = lb_emit_conv(p, b, t_f32);
  939. c = lb_emit_conv(p, c, t_f32);
  940. d = lb_emit_conv(p, d, t_f32);
  941. real = lb_emit_arith(p, op, a, c, t_f32);
  942. imag = lb_emit_arith(p, op, b, d, t_f32);
  943. real = lb_emit_conv(p, real, ft);
  944. imag = lb_emit_conv(p, imag, ft);
  945. } else {
  946. real = lb_emit_arith(p, op, a, c, ft);
  947. imag = lb_emit_arith(p, op, b, d, ft);
  948. }
  949. break;
  950. case Token_Mul: {
  951. lbValue x = lb_emit_arith(p, Token_Mul, a, c, ft);
  952. lbValue y = lb_emit_arith(p, Token_Mul, b, d, ft);
  953. real = lb_emit_arith(p, Token_Sub, x, y, ft);
  954. lbValue z = lb_emit_arith(p, Token_Mul, b, c, ft);
  955. lbValue w = lb_emit_arith(p, Token_Mul, a, d, ft);
  956. imag = lb_emit_arith(p, Token_Add, z, w, ft);
  957. break;
  958. }
  959. }
  960. lb_emit_store(p, lb_emit_struct_ep(p, res.addr, 0), real);
  961. lb_emit_store(p, lb_emit_struct_ep(p, res.addr, 1), imag);
  962. return lb_addr_load(p, res);
  963. } else if (is_type_quaternion(type)) {
  964. lhs = lb_emit_conv(p, lhs, type);
  965. rhs = lb_emit_conv(p, rhs, type);
  966. Type *ft = base_complex_elem_type(type);
  967. if (op == Token_Add || op == Token_Sub) {
  968. Type *immediate_type = ft;
  969. if (type_size_of(ft) == 2) {
  970. immediate_type = t_f32;
  971. }
  972. lbAddr res = lb_add_local_generated(p, type, false); // NOTE: initialized in full later
  973. lbValue x0 = lb_emit_struct_ev(p, lhs, 0);
  974. lbValue x1 = lb_emit_struct_ev(p, lhs, 1);
  975. lbValue x2 = lb_emit_struct_ev(p, lhs, 2);
  976. lbValue x3 = lb_emit_struct_ev(p, lhs, 3);
  977. lbValue y0 = lb_emit_struct_ev(p, rhs, 0);
  978. lbValue y1 = lb_emit_struct_ev(p, rhs, 1);
  979. lbValue y2 = lb_emit_struct_ev(p, rhs, 2);
  980. lbValue y3 = lb_emit_struct_ev(p, rhs, 3);
  981. if (immediate_type != ft) {
  982. x0 = lb_emit_conv(p, x0, immediate_type);
  983. x1 = lb_emit_conv(p, x1, immediate_type);
  984. x2 = lb_emit_conv(p, x2, immediate_type);
  985. x3 = lb_emit_conv(p, x3, immediate_type);
  986. y0 = lb_emit_conv(p, y0, immediate_type);
  987. y1 = lb_emit_conv(p, y1, immediate_type);
  988. y2 = lb_emit_conv(p, y2, immediate_type);
  989. y3 = lb_emit_conv(p, y3, immediate_type);
  990. }
  991. lbValue z0 = lb_emit_arith(p, op, x0, y0, immediate_type);
  992. lbValue z1 = lb_emit_arith(p, op, x1, y1, immediate_type);
  993. lbValue z2 = lb_emit_arith(p, op, x2, y2, immediate_type);
  994. lbValue z3 = lb_emit_arith(p, op, x3, y3, immediate_type);
  995. lbValue d0 = lb_emit_struct_ep(p, res.addr, 0);
  996. lbValue d1 = lb_emit_struct_ep(p, res.addr, 1);
  997. lbValue d2 = lb_emit_struct_ep(p, res.addr, 2);
  998. lbValue d3 = lb_emit_struct_ep(p, res.addr, 3);
  999. if (immediate_type != ft) {
  1000. z0 = lb_emit_conv(p, z0, ft);
  1001. z1 = lb_emit_conv(p, z1, ft);
  1002. z2 = lb_emit_conv(p, z2, ft);
  1003. z3 = lb_emit_conv(p, z3, ft);
  1004. }
  1005. lb_emit_store(p, d0, z0);
  1006. lb_emit_store(p, d1, z1);
  1007. lb_emit_store(p, d2, z2);
  1008. lb_emit_store(p, d3, z3);
  1009. return lb_addr_load(p, res);
  1010. } else if (op == Token_Mul) {
  1011. TEMPORARY_ALLOCATOR_GUARD();
  1012. auto args = array_make<lbValue>(temporary_allocator(), 2);
  1013. args[0] = lhs;
  1014. args[1] = rhs;
  1015. switch (8*type_size_of(ft)) {
  1016. case 16: return lb_emit_runtime_call(p, "mul_quaternion64", args);
  1017. case 32: return lb_emit_runtime_call(p, "mul_quaternion128", args);
  1018. case 64: return lb_emit_runtime_call(p, "mul_quaternion256", args);
  1019. default: GB_PANIC("Unknown float type"); break;
  1020. }
  1021. } else if (op == Token_Quo) {
  1022. TEMPORARY_ALLOCATOR_GUARD();
  1023. auto args = array_make<lbValue>(temporary_allocator(), 2);
  1024. args[0] = lhs;
  1025. args[1] = rhs;
  1026. switch (8*type_size_of(ft)) {
  1027. case 16: return lb_emit_runtime_call(p, "quo_quaternion64", args);
  1028. case 32: return lb_emit_runtime_call(p, "quo_quaternion128", args);
  1029. case 64: return lb_emit_runtime_call(p, "quo_quaternion256", args);
  1030. default: GB_PANIC("Unknown float type"); break;
  1031. }
  1032. }
  1033. }
  1034. lhs = lb_emit_conv(p, lhs, type);
  1035. rhs = lb_emit_conv(p, rhs, type);
  1036. if (is_type_integer(type) && is_type_different_to_arch_endianness(type)) {
  1037. switch (op) {
  1038. case Token_AndNot:
  1039. case Token_And:
  1040. case Token_Or:
  1041. case Token_Xor:
  1042. goto handle_op;
  1043. }
  1044. Type *platform_type = integer_endian_type_to_platform_type(type);
  1045. lbValue x = lb_emit_byte_swap(p, lhs, integer_endian_type_to_platform_type(lhs.type));
  1046. lbValue y = lb_emit_byte_swap(p, rhs, integer_endian_type_to_platform_type(rhs.type));
  1047. lbValue res = lb_emit_arith(p, op, x, y, platform_type);
  1048. return lb_emit_byte_swap(p, res, type);
  1049. }
  1050. if (is_type_float(type) && is_type_different_to_arch_endianness(type)) {
  1051. Type *platform_type = integer_endian_type_to_platform_type(type);
  1052. lbValue x = lb_emit_conv(p, lhs, integer_endian_type_to_platform_type(lhs.type));
  1053. lbValue y = lb_emit_conv(p, rhs, integer_endian_type_to_platform_type(rhs.type));
  1054. lbValue res = lb_emit_arith(p, op, x, y, platform_type);
  1055. return lb_emit_byte_swap(p, res, type);
  1056. }
  1057. handle_op:;
  1058. lbValue res = {};
  1059. res.type = type;
  1060. // NOTE(bill): Bit Set Aliases for + and -
  1061. if (is_type_bit_set(type)) {
  1062. switch (op) {
  1063. case Token_Add: op = Token_Or; break;
  1064. case Token_Sub: op = Token_AndNot; break;
  1065. }
  1066. Type *u = bit_set_to_int(type);
  1067. if (is_type_array(u)) {
  1068. lhs.type = u;
  1069. rhs.type = u;
  1070. res = lb_emit_arith(p, op, lhs, rhs, u);
  1071. res.type = type;
  1072. return res;
  1073. }
  1074. }
  1075. Type *integral_type = type;
  1076. if (is_type_simd_vector(integral_type)) {
  1077. integral_type = core_array_type(integral_type);
  1078. }
  1079. switch (op) {
  1080. case Token_Add:
  1081. if (is_type_float(integral_type)) {
  1082. res.value = LLVMBuildFAdd(p->builder, lhs.value, rhs.value, "");
  1083. return res;
  1084. }
  1085. res.value = LLVMBuildAdd(p->builder, lhs.value, rhs.value, "");
  1086. return res;
  1087. case Token_Sub:
  1088. if (is_type_float(integral_type)) {
  1089. res.value = LLVMBuildFSub(p->builder, lhs.value, rhs.value, "");
  1090. return res;
  1091. }
  1092. res.value = LLVMBuildSub(p->builder, lhs.value, rhs.value, "");
  1093. return res;
  1094. case Token_Mul:
  1095. if (is_type_float(integral_type)) {
  1096. res.value = LLVMBuildFMul(p->builder, lhs.value, rhs.value, "");
  1097. return res;
  1098. }
  1099. res.value = LLVMBuildMul(p->builder, lhs.value, rhs.value, "");
  1100. return res;
  1101. case Token_Quo:
  1102. if (is_type_float(integral_type)) {
  1103. res.value = LLVMBuildFDiv(p->builder, lhs.value, rhs.value, "");
  1104. return res;
  1105. } else if (is_type_unsigned(integral_type)) {
  1106. res.value = LLVMBuildUDiv(p->builder, lhs.value, rhs.value, "");
  1107. return res;
  1108. }
  1109. res.value = LLVMBuildSDiv(p->builder, lhs.value, rhs.value, "");
  1110. return res;
  1111. case Token_Mod:
  1112. if (is_type_float(integral_type)) {
  1113. res.value = LLVMBuildFRem(p->builder, lhs.value, rhs.value, "");
  1114. return res;
  1115. } else if (is_type_unsigned(integral_type)) {
  1116. res.value = LLVMBuildURem(p->builder, lhs.value, rhs.value, "");
  1117. return res;
  1118. }
  1119. res.value = LLVMBuildSRem(p->builder, lhs.value, rhs.value, "");
  1120. return res;
  1121. case Token_ModMod:
  1122. if (is_type_unsigned(integral_type)) {
  1123. res.value = LLVMBuildURem(p->builder, lhs.value, rhs.value, "");
  1124. return res;
  1125. } else {
  1126. LLVMValueRef a = LLVMBuildSRem(p->builder, lhs.value, rhs.value, "");
  1127. LLVMValueRef b = LLVMBuildAdd(p->builder, a, rhs.value, "");
  1128. LLVMValueRef c = LLVMBuildSRem(p->builder, b, rhs.value, "");
  1129. res.value = c;
  1130. return res;
  1131. }
  1132. case Token_And:
  1133. res.value = LLVMBuildAnd(p->builder, lhs.value, rhs.value, "");
  1134. return res;
  1135. case Token_Or:
  1136. res.value = LLVMBuildOr(p->builder, lhs.value, rhs.value, "");
  1137. return res;
  1138. case Token_Xor:
  1139. res.value = LLVMBuildXor(p->builder, lhs.value, rhs.value, "");
  1140. return res;
  1141. case Token_Shl:
  1142. {
  1143. rhs = lb_emit_conv(p, rhs, lhs.type);
  1144. LLVMValueRef lhsval = lhs.value;
  1145. LLVMValueRef bits = rhs.value;
  1146. LLVMValueRef bit_size = LLVMConstInt(lb_type(p->module, rhs.type), 8*type_size_of(lhs.type), false);
  1147. LLVMValueRef width_test = LLVMBuildICmp(p->builder, LLVMIntULT, bits, bit_size, "");
  1148. res.value = LLVMBuildShl(p->builder, lhsval, bits, "");
  1149. LLVMValueRef zero = LLVMConstNull(lb_type(p->module, lhs.type));
  1150. res.value = LLVMBuildSelect(p->builder, width_test, res.value, zero, "");
  1151. return res;
  1152. }
  1153. case Token_Shr:
  1154. {
  1155. rhs = lb_emit_conv(p, rhs, lhs.type);
  1156. LLVMValueRef lhsval = lhs.value;
  1157. LLVMValueRef bits = rhs.value;
  1158. bool is_unsigned = is_type_unsigned(integral_type);
  1159. LLVMValueRef bit_size = LLVMConstInt(lb_type(p->module, rhs.type), 8*type_size_of(lhs.type), false);
  1160. LLVMValueRef width_test = LLVMBuildICmp(p->builder, LLVMIntULT, bits, bit_size, "");
  1161. if (is_unsigned) {
  1162. res.value = LLVMBuildLShr(p->builder, lhsval, bits, "");
  1163. } else {
  1164. res.value = LLVMBuildAShr(p->builder, lhsval, bits, "");
  1165. }
  1166. LLVMValueRef zero = LLVMConstNull(lb_type(p->module, lhs.type));
  1167. res.value = LLVMBuildSelect(p->builder, width_test, res.value, zero, "");
  1168. return res;
  1169. }
  1170. case Token_AndNot:
  1171. {
  1172. LLVMValueRef new_rhs = LLVMBuildNot(p->builder, rhs.value, "");
  1173. res.value = LLVMBuildAnd(p->builder, lhs.value, new_rhs, "");
  1174. return res;
  1175. }
  1176. break;
  1177. }
  1178. GB_PANIC("unhandled operator of lb_emit_arith");
  1179. return {};
  1180. }
  1181. gb_internal bool lb_is_empty_string_constant(Ast *expr) {
  1182. if (expr->tav.value.kind == ExactValue_String &&
  1183. is_type_string(expr->tav.type)) {
  1184. String s = expr->tav.value.value_string;
  1185. return s.len == 0;
  1186. }
  1187. return false;
  1188. }
  1189. gb_internal lbValue lb_build_binary_in(lbProcedure *p, lbValue left, lbValue right, TokenKind op) {
  1190. Type *rt = base_type(right.type);
  1191. if (is_type_pointer(rt)) {
  1192. right = lb_emit_load(p, right);
  1193. rt = base_type(type_deref(rt));
  1194. }
  1195. switch (rt->kind) {
  1196. case Type_Map:
  1197. {
  1198. lbValue map_ptr = lb_address_from_load_or_generate_local(p, right);
  1199. lbValue key = left;
  1200. lbValue ptr = lb_internal_dynamic_map_get_ptr(p, map_ptr, key);
  1201. if (op == Token_in) {
  1202. return lb_emit_conv(p, lb_emit_comp_against_nil(p, Token_NotEq, ptr), t_bool);
  1203. } else {
  1204. return lb_emit_conv(p, lb_emit_comp_against_nil(p, Token_CmpEq, ptr), t_bool);
  1205. }
  1206. }
  1207. break;
  1208. case Type_BitSet:
  1209. {
  1210. Type *key_type = rt->BitSet.elem;
  1211. GB_ASSERT(are_types_identical(left.type, key_type));
  1212. Type *it = bit_set_to_int(rt);
  1213. left = lb_emit_conv(p, left, it);
  1214. if (is_type_different_to_arch_endianness(it)) {
  1215. left = lb_emit_byte_swap(p, left, integer_endian_type_to_platform_type(it));
  1216. }
  1217. lbValue lower = lb_const_value(p->module, left.type, exact_value_i64(rt->BitSet.lower));
  1218. lbValue key = lb_emit_arith(p, Token_Sub, left, lower, left.type);
  1219. lbValue bit = lb_emit_arith(p, Token_Shl, lb_const_int(p->module, left.type, 1), key, left.type);
  1220. bit = lb_emit_conv(p, bit, it);
  1221. lbValue old_value = lb_emit_transmute(p, right, it);
  1222. lbValue new_value = lb_emit_arith(p, Token_And, old_value, bit, it);
  1223. if (op == Token_in) {
  1224. return lb_emit_conv(p, lb_emit_comp(p, Token_NotEq, new_value, lb_const_int(p->module, new_value.type, 0)), t_bool);
  1225. } else {
  1226. return lb_emit_conv(p, lb_emit_comp(p, Token_CmpEq, new_value, lb_const_int(p->module, new_value.type, 0)), t_bool);
  1227. }
  1228. }
  1229. break;
  1230. }
  1231. GB_PANIC("Invalid 'in' type");
  1232. return {};
  1233. }
  1234. gb_internal lbValue lb_build_binary_expr(lbProcedure *p, Ast *expr) {
  1235. ast_node(be, BinaryExpr, expr);
  1236. TypeAndValue tv = type_and_value_of_expr(expr);
  1237. if (is_type_matrix(be->left->tav.type) || is_type_matrix(be->right->tav.type)) {
  1238. lbValue left = lb_build_expr(p, be->left);
  1239. lbValue right = lb_build_expr(p, be->right);
  1240. return lb_emit_arith_matrix(p, be->op.kind, left, right, default_type(tv.type), false);
  1241. }
  1242. switch (be->op.kind) {
  1243. case Token_Add:
  1244. case Token_Sub:
  1245. case Token_Mul:
  1246. case Token_Quo:
  1247. case Token_Mod:
  1248. case Token_ModMod:
  1249. case Token_And:
  1250. case Token_Or:
  1251. case Token_Xor:
  1252. case Token_AndNot: {
  1253. Type *type = default_type(tv.type);
  1254. lbValue left = lb_build_expr(p, be->left);
  1255. lbValue right = lb_build_expr(p, be->right);
  1256. return lb_emit_arith(p, be->op.kind, left, right, type);
  1257. }
  1258. case Token_Shl:
  1259. case Token_Shr: {
  1260. lbValue left, right;
  1261. Type *type = default_type(tv.type);
  1262. left = lb_build_expr(p, be->left);
  1263. if (lb_is_expr_untyped_const(be->right)) {
  1264. // NOTE(bill): RHS shift operands can still be untyped
  1265. // Just bypass the standard lb_build_expr
  1266. right = lb_expr_untyped_const_to_typed(p->module, be->right, type);
  1267. } else {
  1268. right = lb_build_expr(p, be->right);
  1269. }
  1270. return lb_emit_arith(p, be->op.kind, left, right, type);
  1271. }
  1272. case Token_CmpEq:
  1273. case Token_NotEq:
  1274. if (is_type_untyped_nil(be->right->tav.type)) {
  1275. // `x == nil` or `x != nil`
  1276. lbValue left = lb_build_expr(p, be->left);
  1277. lbValue cmp = lb_emit_comp_against_nil(p, be->op.kind, left);
  1278. Type *type = default_type(tv.type);
  1279. return lb_emit_conv(p, cmp, type);
  1280. } else if (is_type_untyped_nil(be->left->tav.type)) {
  1281. // `nil == x` or `nil != x`
  1282. lbValue right = lb_build_expr(p, be->right);
  1283. lbValue cmp = lb_emit_comp_against_nil(p, be->op.kind, right);
  1284. Type *type = default_type(tv.type);
  1285. return lb_emit_conv(p, cmp, type);
  1286. } else if (lb_is_empty_string_constant(be->right)) {
  1287. // `x == ""` or `x != ""`
  1288. lbValue s = lb_build_expr(p, be->left);
  1289. s = lb_emit_conv(p, s, t_string);
  1290. lbValue len = lb_string_len(p, s);
  1291. lbValue cmp = lb_emit_comp(p, be->op.kind, len, lb_const_int(p->module, t_int, 0));
  1292. Type *type = default_type(tv.type);
  1293. return lb_emit_conv(p, cmp, type);
  1294. } else if (lb_is_empty_string_constant(be->left)) {
  1295. // `"" == x` or `"" != x`
  1296. lbValue s = lb_build_expr(p, be->right);
  1297. s = lb_emit_conv(p, s, t_string);
  1298. lbValue len = lb_string_len(p, s);
  1299. lbValue cmp = lb_emit_comp(p, be->op.kind, len, lb_const_int(p->module, t_int, 0));
  1300. Type *type = default_type(tv.type);
  1301. return lb_emit_conv(p, cmp, type);
  1302. }
  1303. /*fallthrough*/
  1304. case Token_Lt:
  1305. case Token_LtEq:
  1306. case Token_Gt:
  1307. case Token_GtEq:
  1308. {
  1309. lbValue left = {};
  1310. lbValue right = {};
  1311. if (be->left->tav.mode == Addressing_Type) {
  1312. left = lb_typeid(p->module, be->left->tav.type);
  1313. }
  1314. if (be->right->tav.mode == Addressing_Type) {
  1315. right = lb_typeid(p->module, be->right->tav.type);
  1316. }
  1317. if (left.value == nullptr) left = lb_build_expr(p, be->left);
  1318. if (right.value == nullptr) right = lb_build_expr(p, be->right);
  1319. lbValue cmp = lb_emit_comp(p, be->op.kind, left, right);
  1320. Type *type = default_type(tv.type);
  1321. return lb_emit_conv(p, cmp, type);
  1322. }
  1323. case Token_CmpAnd:
  1324. case Token_CmpOr:
  1325. return lb_emit_logical_binary_expr(p, be->op.kind, be->left, be->right, tv.type);
  1326. case Token_in:
  1327. case Token_not_in:
  1328. {
  1329. lbValue left = lb_build_expr(p, be->left);
  1330. lbValue right = lb_build_expr(p, be->right);
  1331. return lb_build_binary_in(p, left, right, be->op.kind);
  1332. }
  1333. default:
  1334. GB_PANIC("Invalid binary expression");
  1335. break;
  1336. }
  1337. return {};
  1338. }
  1339. gb_internal lbValue lb_emit_conv(lbProcedure *p, lbValue value, Type *t) {
  1340. lbModule *m = p->module;
  1341. t = reduce_tuple_to_single_type(t);
  1342. Type *src_type = value.type;
  1343. if (are_types_identical(t, src_type)) {
  1344. return value;
  1345. }
  1346. Type *src = core_type(src_type);
  1347. Type *dst = core_type(t);
  1348. GB_ASSERT(src != nullptr);
  1349. GB_ASSERT(dst != nullptr);
  1350. if (is_type_untyped_uninit(src)) {
  1351. return lb_const_undef(m, t);
  1352. }
  1353. if (is_type_untyped_nil(src)) {
  1354. return lb_const_nil(m, t);
  1355. }
  1356. if (LLVMIsConstant(value.value)) {
  1357. if (is_type_any(dst)) {
  1358. Type *st = default_type(src_type);
  1359. lbAddr default_value = lb_add_local_generated(p, st, false);
  1360. lb_addr_store(p, default_value, value);
  1361. lbValue data = lb_emit_conv(p, default_value.addr, t_rawptr);
  1362. lbValue id = lb_typeid(m, st);
  1363. lbAddr res = lb_add_local_generated(p, t, false);
  1364. lbValue a0 = lb_emit_struct_ep(p, res.addr, 0);
  1365. lbValue a1 = lb_emit_struct_ep(p, res.addr, 1);
  1366. lb_emit_store(p, a0, data);
  1367. lb_emit_store(p, a1, id);
  1368. return lb_addr_load(p, res);
  1369. } else if (dst->kind == Type_Basic) {
  1370. if (src->Basic.kind == Basic_string && dst->Basic.kind == Basic_cstring) {
  1371. String str = lb_get_const_string(m, value);
  1372. lbValue res = {};
  1373. res.type = t;
  1374. res.value = llvm_cstring(m, str);
  1375. return res;
  1376. }
  1377. // if (is_type_float(dst)) {
  1378. // return value;
  1379. // } else if (is_type_integer(dst)) {
  1380. // return value;
  1381. // }
  1382. // ExactValue ev = value->Constant.value;
  1383. // if (is_type_float(dst)) {
  1384. // ev = exact_value_to_float(ev);
  1385. // } else if (is_type_complex(dst)) {
  1386. // ev = exact_value_to_complex(ev);
  1387. // } else if (is_type_quaternion(dst)) {
  1388. // ev = exact_value_to_quaternion(ev);
  1389. // } else if (is_type_string(dst)) {
  1390. // // Handled elsewhere
  1391. // GB_ASSERT_MSG(ev.kind == ExactValue_String, "%d", ev.kind);
  1392. // } else if (is_type_integer(dst)) {
  1393. // ev = exact_value_to_integer(ev);
  1394. // } else if (is_type_pointer(dst)) {
  1395. // // IMPORTANT NOTE(bill): LLVM doesn't support pointer constants expect 'null'
  1396. // lbValue i = lb_add_module_constant(p->module, t_uintptr, ev);
  1397. // return lb_emit(p, lb_instr_conv(p, irConv_inttoptr, i, t_uintptr, dst));
  1398. // }
  1399. // return lb_const_value(p->module, t, ev);
  1400. }
  1401. }
  1402. if (are_types_identical(src, dst)) {
  1403. if (!are_types_identical(src_type, t)) {
  1404. return lb_emit_transmute(p, value, t);
  1405. }
  1406. return value;
  1407. }
  1408. // bool <-> llvm bool
  1409. if (is_type_boolean(src) && dst == t_llvm_bool) {
  1410. lbValue res = {};
  1411. res.value = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(lb_type(m, src)), "");
  1412. res.type = t;
  1413. return res;
  1414. }
  1415. if (src == t_llvm_bool && is_type_boolean(dst)) {
  1416. lbValue res = {};
  1417. res.value = LLVMBuildZExt(p->builder, value.value, lb_type(m, dst), "");
  1418. res.type = t;
  1419. return res;
  1420. }
  1421. // integer -> integer
  1422. if (is_type_integer(src) && is_type_integer(dst)) {
  1423. GB_ASSERT(src->kind == Type_Basic &&
  1424. dst->kind == Type_Basic);
  1425. i64 sz = type_size_of(default_type(src));
  1426. i64 dz = type_size_of(default_type(dst));
  1427. if (sz == dz) {
  1428. if (dz > 1 && !types_have_same_internal_endian(src, dst)) {
  1429. return lb_emit_byte_swap(p, value, t);
  1430. }
  1431. lbValue res = {};
  1432. res.value = value.value;
  1433. res.type = t;
  1434. return res;
  1435. }
  1436. if (sz > 1 && is_type_different_to_arch_endianness(src)) {
  1437. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1438. value = lb_emit_byte_swap(p, value, platform_src_type);
  1439. }
  1440. LLVMOpcode op = LLVMTrunc;
  1441. if (dz < sz) {
  1442. op = LLVMTrunc;
  1443. } else if (dz == sz) {
  1444. // NOTE(bill): In LLVM, all integers are signed and rely upon 2's compliment
  1445. // NOTE(bill): Copy the value just for type correctness
  1446. op = LLVMBitCast;
  1447. } else if (dz > sz) {
  1448. op = is_type_unsigned(src) ? LLVMZExt : LLVMSExt; // zero extent
  1449. }
  1450. if (dz > 1 && is_type_different_to_arch_endianness(dst)) {
  1451. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1452. lbValue res = {};
  1453. res.value = LLVMBuildCast(p->builder, op, value.value, lb_type(m, platform_dst_type), "");
  1454. res.type = t;
  1455. return lb_emit_byte_swap(p, res, t);
  1456. } else {
  1457. lbValue res = {};
  1458. res.value = LLVMBuildCast(p->builder, op, value.value, lb_type(m, t), "");
  1459. res.type = t;
  1460. return res;
  1461. }
  1462. }
  1463. // boolean -> boolean/integer
  1464. if (is_type_boolean(src) && (is_type_boolean(dst) || is_type_integer(dst))) {
  1465. LLVMValueRef b = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(lb_type(m, value.type)), "");
  1466. lbValue res = {};
  1467. res.value = LLVMBuildIntCast2(p->builder, b, lb_type(m, t), false, "");
  1468. res.type = t;
  1469. return res;
  1470. }
  1471. if (is_type_cstring(src) && is_type_u8_ptr(dst)) {
  1472. return lb_emit_transmute(p, value, dst);
  1473. }
  1474. if (is_type_u8_ptr(src) && is_type_cstring(dst)) {
  1475. return lb_emit_transmute(p, value, dst);
  1476. }
  1477. if (is_type_cstring(src) && is_type_u8_multi_ptr(dst)) {
  1478. return lb_emit_transmute(p, value, dst);
  1479. }
  1480. if (is_type_u8_multi_ptr(src) && is_type_cstring(dst)) {
  1481. return lb_emit_transmute(p, value, dst);
  1482. }
  1483. if (is_type_cstring(src) && is_type_rawptr(dst)) {
  1484. return lb_emit_transmute(p, value, dst);
  1485. }
  1486. if (is_type_rawptr(src) && is_type_cstring(dst)) {
  1487. return lb_emit_transmute(p, value, dst);
  1488. }
  1489. if (are_types_identical(src, t_cstring) && are_types_identical(dst, t_string)) {
  1490. TEMPORARY_ALLOCATOR_GUARD();
  1491. lbValue c = lb_emit_conv(p, value, t_cstring);
  1492. auto args = array_make<lbValue>(temporary_allocator(), 1);
  1493. args[0] = c;
  1494. lbValue s = lb_emit_runtime_call(p, "cstring_to_string", args);
  1495. return lb_emit_conv(p, s, dst);
  1496. }
  1497. // integer -> boolean
  1498. if (is_type_integer(src) && is_type_boolean(dst)) {
  1499. lbValue res = {};
  1500. res.value = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(lb_type(m, value.type)), "");
  1501. res.type = t_llvm_bool;
  1502. return lb_emit_conv(p, res, t);
  1503. }
  1504. // float -> float
  1505. if (is_type_float(src) && is_type_float(dst)) {
  1506. i64 sz = type_size_of(src);
  1507. i64 dz = type_size_of(dst);
  1508. if (dz == sz) {
  1509. if (types_have_same_internal_endian(src, dst)) {
  1510. lbValue res = {};
  1511. res.type = t;
  1512. res.value = value.value;
  1513. return res;
  1514. } else {
  1515. return lb_emit_byte_swap(p, value, t);
  1516. }
  1517. }
  1518. if (is_type_different_to_arch_endianness(src) || is_type_different_to_arch_endianness(dst)) {
  1519. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1520. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1521. lbValue res = {};
  1522. res = lb_emit_conv(p, value, platform_src_type);
  1523. res = lb_emit_conv(p, res, platform_dst_type);
  1524. if (is_type_different_to_arch_endianness(dst)) {
  1525. res = lb_emit_byte_swap(p, res, t);
  1526. }
  1527. return lb_emit_conv(p, res, t);
  1528. }
  1529. lbValue res = {};
  1530. res.type = t;
  1531. if (dz >= sz) {
  1532. res.value = LLVMBuildFPExt(p->builder, value.value, lb_type(m, t), "");
  1533. } else {
  1534. res.value = LLVMBuildFPTrunc(p->builder, value.value, lb_type(m, t), "");
  1535. }
  1536. return res;
  1537. }
  1538. if (is_type_complex(src) && is_type_complex(dst)) {
  1539. Type *ft = base_complex_elem_type(dst);
  1540. lbAddr gen = lb_add_local_generated(p, t, false);
  1541. lbValue gp = lb_addr_get_ptr(p, gen);
  1542. lbValue real = lb_emit_conv(p, lb_emit_struct_ev(p, value, 0), ft);
  1543. lbValue imag = lb_emit_conv(p, lb_emit_struct_ev(p, value, 1), ft);
  1544. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), real);
  1545. lb_emit_store(p, lb_emit_struct_ep(p, gp, 1), imag);
  1546. return lb_addr_load(p, gen);
  1547. }
  1548. if (is_type_quaternion(src) && is_type_quaternion(dst)) {
  1549. // @QuaternionLayout
  1550. Type *ft = base_complex_elem_type(dst);
  1551. lbAddr gen = lb_add_local_generated(p, t, false);
  1552. lbValue gp = lb_addr_get_ptr(p, gen);
  1553. lbValue q0 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 0), ft);
  1554. lbValue q1 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 1), ft);
  1555. lbValue q2 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 2), ft);
  1556. lbValue q3 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 3), ft);
  1557. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), q0);
  1558. lb_emit_store(p, lb_emit_struct_ep(p, gp, 1), q1);
  1559. lb_emit_store(p, lb_emit_struct_ep(p, gp, 2), q2);
  1560. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), q3);
  1561. return lb_addr_load(p, gen);
  1562. }
  1563. if (is_type_integer(src) && is_type_complex(dst)) {
  1564. Type *ft = base_complex_elem_type(dst);
  1565. lbAddr gen = lb_add_local_generated(p, t, true);
  1566. lbValue gp = lb_addr_get_ptr(p, gen);
  1567. lbValue real = lb_emit_conv(p, value, ft);
  1568. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), real);
  1569. return lb_addr_load(p, gen);
  1570. }
  1571. if (is_type_float(src) && is_type_complex(dst)) {
  1572. Type *ft = base_complex_elem_type(dst);
  1573. lbAddr gen = lb_add_local_generated(p, t, true);
  1574. lbValue gp = lb_addr_get_ptr(p, gen);
  1575. lbValue real = lb_emit_conv(p, value, ft);
  1576. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), real);
  1577. return lb_addr_load(p, gen);
  1578. }
  1579. if (is_type_integer(src) && is_type_quaternion(dst)) {
  1580. Type *ft = base_complex_elem_type(dst);
  1581. lbAddr gen = lb_add_local_generated(p, t, true);
  1582. lbValue gp = lb_addr_get_ptr(p, gen);
  1583. lbValue real = lb_emit_conv(p, value, ft);
  1584. // @QuaternionLayout
  1585. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), real);
  1586. return lb_addr_load(p, gen);
  1587. }
  1588. if (is_type_float(src) && is_type_quaternion(dst)) {
  1589. Type *ft = base_complex_elem_type(dst);
  1590. lbAddr gen = lb_add_local_generated(p, t, true);
  1591. lbValue gp = lb_addr_get_ptr(p, gen);
  1592. lbValue real = lb_emit_conv(p, value, ft);
  1593. // @QuaternionLayout
  1594. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), real);
  1595. return lb_addr_load(p, gen);
  1596. }
  1597. if (is_type_complex(src) && is_type_quaternion(dst)) {
  1598. Type *ft = base_complex_elem_type(dst);
  1599. lbAddr gen = lb_add_local_generated(p, t, true);
  1600. lbValue gp = lb_addr_get_ptr(p, gen);
  1601. lbValue real = lb_emit_conv(p, lb_emit_struct_ev(p, value, 0), ft);
  1602. lbValue imag = lb_emit_conv(p, lb_emit_struct_ev(p, value, 1), ft);
  1603. // @QuaternionLayout
  1604. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), real);
  1605. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), imag);
  1606. return lb_addr_load(p, gen);
  1607. }
  1608. // float <-> integer
  1609. if (is_type_float(src) && is_type_integer(dst)) {
  1610. if (is_type_different_to_arch_endianness(src) || is_type_different_to_arch_endianness(dst)) {
  1611. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1612. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1613. lbValue res = {};
  1614. res = lb_emit_conv(p, value, platform_src_type);
  1615. res = lb_emit_conv(p, res, platform_dst_type);
  1616. return lb_emit_conv(p, res, t);
  1617. }
  1618. if (is_type_integer_128bit(dst)) {
  1619. TEMPORARY_ALLOCATOR_GUARD();
  1620. auto args = array_make<lbValue>(temporary_allocator(), 1);
  1621. args[0] = value;
  1622. char const *call = "fixunsdfdi";
  1623. if (is_type_unsigned(dst)) {
  1624. call = "fixunsdfti";
  1625. }
  1626. lbValue res_i128 = lb_emit_runtime_call(p, call, args);
  1627. return lb_emit_conv(p, res_i128, t);
  1628. }
  1629. i64 sz = type_size_of(src);
  1630. lbValue res = {};
  1631. res.type = t;
  1632. if (is_type_unsigned(dst)) {
  1633. switch (sz) {
  1634. case 2:
  1635. case 4:
  1636. res.value = LLVMBuildFPToUI(p->builder, value.value, lb_type(m, t_u32), "");
  1637. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), false, "");
  1638. break;
  1639. case 8:
  1640. res.value = LLVMBuildFPToUI(p->builder, value.value, lb_type(m, t_u64), "");
  1641. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), false, "");
  1642. break;
  1643. default:
  1644. GB_PANIC("Unhandled float type");
  1645. break;
  1646. }
  1647. } else {
  1648. switch (sz) {
  1649. case 2:
  1650. case 4:
  1651. res.value = LLVMBuildFPToSI(p->builder, value.value, lb_type(m, t_i32), "");
  1652. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), true, "");
  1653. break;
  1654. case 8:
  1655. res.value = LLVMBuildFPToSI(p->builder, value.value, lb_type(m, t_i64), "");
  1656. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), true, "");
  1657. break;
  1658. default:
  1659. GB_PANIC("Unhandled float type");
  1660. break;
  1661. }
  1662. }
  1663. return res;
  1664. }
  1665. if (is_type_integer(src) && is_type_float(dst)) {
  1666. if (is_type_different_to_arch_endianness(src) || is_type_different_to_arch_endianness(dst)) {
  1667. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1668. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1669. lbValue res = {};
  1670. res = lb_emit_conv(p, value, platform_src_type);
  1671. res = lb_emit_conv(p, res, platform_dst_type);
  1672. if (is_type_different_to_arch_endianness(dst)) {
  1673. res = lb_emit_byte_swap(p, res, t);
  1674. }
  1675. return lb_emit_conv(p, res, t);
  1676. }
  1677. if (is_type_integer_128bit(src)) {
  1678. TEMPORARY_ALLOCATOR_GUARD();
  1679. auto args = array_make<lbValue>(temporary_allocator(), 1);
  1680. args[0] = value;
  1681. char const *call = "floattidf";
  1682. if (is_type_unsigned(src)) {
  1683. call = "floattidf_unsigned";
  1684. }
  1685. lbValue res_f64 = lb_emit_runtime_call(p, call, args);
  1686. return lb_emit_conv(p, res_f64, t);
  1687. }
  1688. lbValue res = {};
  1689. res.type = t;
  1690. if (is_type_unsigned(src)) {
  1691. res.value = LLVMBuildUIToFP(p->builder, value.value, lb_type(m, t), "");
  1692. } else {
  1693. res.value = LLVMBuildSIToFP(p->builder, value.value, lb_type(m, t), "");
  1694. }
  1695. return res;
  1696. }
  1697. if (is_type_simd_vector(dst)) {
  1698. Type *et = base_array_type(dst);
  1699. if (is_type_simd_vector(src)) {
  1700. Type *src_elem = core_array_type(src);
  1701. Type *dst_elem = core_array_type(dst);
  1702. GB_ASSERT(src->SimdVector.count == dst->SimdVector.count);
  1703. lbValue res = {};
  1704. res.type = t;
  1705. if (are_types_identical(src_elem, dst_elem)) {
  1706. res.value = value.value;
  1707. } else if (is_type_float(src_elem) && is_type_integer(dst_elem)) {
  1708. if (is_type_unsigned(dst_elem)) {
  1709. res.value = LLVMBuildFPToUI(p->builder, value.value, lb_type(m, t), "");
  1710. } else {
  1711. res.value = LLVMBuildFPToSI(p->builder, value.value, lb_type(m, t), "");
  1712. }
  1713. } else if (is_type_integer(src_elem) && is_type_float(dst_elem)) {
  1714. if (is_type_unsigned(src_elem)) {
  1715. res.value = LLVMBuildUIToFP(p->builder, value.value, lb_type(m, t), "");
  1716. } else {
  1717. res.value = LLVMBuildSIToFP(p->builder, value.value, lb_type(m, t), "");
  1718. }
  1719. } else if ((is_type_integer(src_elem) || is_type_boolean(src_elem)) && is_type_integer(dst_elem)) {
  1720. res.value = LLVMBuildIntCast2(p->builder, value.value, lb_type(m, t), !is_type_unsigned(src_elem), "");
  1721. } else if (is_type_float(src_elem) && is_type_float(dst_elem)) {
  1722. res.value = LLVMBuildFPCast(p->builder, value.value, lb_type(m, t), "");
  1723. } else if (is_type_integer(src_elem) && is_type_boolean(dst_elem)) {
  1724. LLVMValueRef i1vector = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(LLVMTypeOf(value.value)), "");
  1725. res.value = LLVMBuildIntCast2(p->builder, i1vector, lb_type(m, t), !is_type_unsigned(src_elem), "");
  1726. } else if (is_type_pointer(src_elem) && is_type_integer(dst_elem)) {
  1727. res.value = LLVMBuildPtrToInt(p->builder, value.value, lb_type(m, t), "");
  1728. } else if (is_type_integer(src_elem) && is_type_pointer(dst_elem)) {
  1729. res.value = LLVMBuildIntToPtr(p->builder, value.value, lb_type(m, t), "");
  1730. }else {
  1731. GB_PANIC("Unhandled simd vector conversion: %s -> %s", type_to_string(src), type_to_string(dst));
  1732. }
  1733. return res;
  1734. } else {
  1735. i64 count = get_array_type_count(dst);
  1736. LLVMTypeRef vt = lb_type(m, t);
  1737. LLVMTypeRef llvm_u32 = lb_type(m, t_u32);
  1738. LLVMValueRef elem = lb_emit_conv(p, value, et).value;
  1739. LLVMValueRef vector = LLVMConstNull(vt);
  1740. for (i64 i = 0; i < count; i++) {
  1741. LLVMValueRef idx = LLVMConstInt(llvm_u32, i, false);
  1742. vector = LLVMBuildInsertElement(p->builder, vector, elem, idx, "");
  1743. }
  1744. lbValue res = {};
  1745. res.type = t;
  1746. res.value = vector;
  1747. return res;
  1748. }
  1749. }
  1750. // bit_field <-> backing type
  1751. if (is_type_bit_field(src)) {
  1752. if (are_types_identical(src->BitField.backing_type, dst)) {
  1753. lbValue res = {};
  1754. res.type = t;
  1755. res.value = value.value;
  1756. return res;
  1757. }
  1758. }
  1759. if (is_type_bit_field(dst)) {
  1760. if (are_types_identical(src, dst->BitField.backing_type)) {
  1761. lbValue res = {};
  1762. res.type = t;
  1763. res.value = value.value;
  1764. return res;
  1765. }
  1766. }
  1767. // bit_set <-> backing type
  1768. if (is_type_bit_set(src)) {
  1769. Type *backing = bit_set_to_int(src);
  1770. if (are_types_identical(backing, dst)) {
  1771. lbValue res = {};
  1772. res.type = t;
  1773. res.value = value.value;
  1774. return res;
  1775. }
  1776. }
  1777. if (is_type_bit_set(dst)) {
  1778. Type *backing = bit_set_to_int(dst);
  1779. if (are_types_identical(src, backing)) {
  1780. lbValue res = {};
  1781. res.type = t;
  1782. res.value = value.value;
  1783. return res;
  1784. }
  1785. }
  1786. // Pointer <-> uintptr
  1787. if (is_type_pointer(src) && is_type_uintptr(dst)) {
  1788. lbValue res = {};
  1789. res.type = t;
  1790. res.value = LLVMBuildPtrToInt(p->builder, value.value, lb_type(m, t), "");
  1791. return res;
  1792. }
  1793. if (is_type_uintptr(src) && is_type_pointer(dst)) {
  1794. lbValue res = {};
  1795. res.type = t;
  1796. res.value = LLVMBuildIntToPtr(p->builder, value.value, lb_type(m, t), "");
  1797. return res;
  1798. }
  1799. if (is_type_multi_pointer(src) && is_type_uintptr(dst)) {
  1800. lbValue res = {};
  1801. res.type = t;
  1802. res.value = LLVMBuildPtrToInt(p->builder, value.value, lb_type(m, t), "");
  1803. return res;
  1804. }
  1805. if (is_type_uintptr(src) && is_type_multi_pointer(dst)) {
  1806. lbValue res = {};
  1807. res.type = t;
  1808. res.value = LLVMBuildIntToPtr(p->builder, value.value, lb_type(m, t), "");
  1809. return res;
  1810. }
  1811. if (is_type_union(dst)) {
  1812. if (dst->Union.variants.count == 1) {
  1813. Type *vt = dst->Union.variants[0];
  1814. if (internal_check_is_assignable_to(src_type, vt)) {
  1815. value = lb_emit_conv(p, value, vt);
  1816. lbAddr parent = lb_add_local_generated(p, t, true);
  1817. lb_emit_store_union_variant(p, parent.addr, value, vt);
  1818. return lb_addr_load(p, parent);
  1819. }
  1820. }
  1821. for (Type *vt : dst->Union.variants) {
  1822. if (are_types_identical(src_type, vt)) {
  1823. lbAddr parent = lb_add_local_generated(p, t, true);
  1824. lb_emit_store_union_variant(p, parent.addr, value, vt);
  1825. return lb_addr_load(p, parent);
  1826. }
  1827. }
  1828. ValidIndexAndScore *valids = gb_alloc_array(temporary_allocator(), ValidIndexAndScore, dst->Union.variants.count);
  1829. isize valid_count = 0;
  1830. isize first_success_index = -1;
  1831. for_array(i, dst->Union.variants) {
  1832. Type *vt = dst->Union.variants[i];
  1833. i64 score = 0;
  1834. if (internal_check_is_assignable_to(src_type, vt)) {
  1835. valids[valid_count].index = i;
  1836. valids[valid_count].score = score;
  1837. valid_count += 1;
  1838. if (first_success_index < 0) {
  1839. first_success_index = i;
  1840. }
  1841. }
  1842. }
  1843. if (valid_count > 1) {
  1844. gb_sort_array(valids, valid_count, valid_index_and_score_cmp);
  1845. i64 best_score = valids[0].score;
  1846. for (isize i = 1; i < valid_count; i++) {
  1847. auto v = valids[i];
  1848. if (best_score > v.score) {
  1849. valid_count = i;
  1850. break;
  1851. }
  1852. best_score = v.score;
  1853. }
  1854. first_success_index = valids[0].index;
  1855. }
  1856. if (valid_count == 1) {
  1857. Type *vt = dst->Union.variants[first_success_index];
  1858. value = lb_emit_conv(p, value, vt);
  1859. lbAddr parent = lb_add_local_generated(p, t, true);
  1860. lb_emit_store_union_variant(p, parent.addr, value, vt);
  1861. return lb_addr_load(p, parent);
  1862. }
  1863. }
  1864. // NOTE(bill): This has to be done before 'Pointer <-> Pointer' as it's
  1865. // subtype polymorphism casting
  1866. if (check_is_assignable_to_using_subtype(src_type, t)) {
  1867. Type *st = type_deref(src_type);
  1868. st = type_deref(st);
  1869. bool st_is_ptr = is_type_pointer(src_type);
  1870. st = base_type(st);
  1871. Type *dt = t;
  1872. GB_ASSERT(is_type_struct(st) || is_type_raw_union(st));
  1873. Selection sel = {};
  1874. sel.index.allocator = heap_allocator();
  1875. defer (array_free(&sel.index));
  1876. if (lookup_subtype_polymorphic_selection(t, src_type, &sel)) {
  1877. if (sel.entity == nullptr) {
  1878. GB_PANIC("invalid subtype cast %s -> ", type_to_string(src_type), type_to_string(t));
  1879. }
  1880. if (st_is_ptr) {
  1881. lbValue res = lb_emit_deep_field_gep(p, value, sel);
  1882. Type *rt = res.type;
  1883. if (!are_types_identical(rt, dt) && are_types_identical(type_deref(rt), dt)) {
  1884. res = lb_emit_load(p, res);
  1885. }
  1886. return res;
  1887. } else {
  1888. if (is_type_pointer(value.type)) {
  1889. Type *rt = value.type;
  1890. if (!are_types_identical(rt, dt) && are_types_identical(type_deref(rt), dt)) {
  1891. value = lb_emit_load(p, value);
  1892. } else {
  1893. value = lb_emit_deep_field_gep(p, value, sel);
  1894. return lb_emit_load(p, value);
  1895. }
  1896. }
  1897. return lb_emit_deep_field_ev(p, value, sel);
  1898. }
  1899. }
  1900. }
  1901. // Pointer <-> Pointer
  1902. if (is_type_pointer(src) && is_type_pointer(dst)) {
  1903. lbValue res = {};
  1904. res.type = t;
  1905. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1906. return res;
  1907. }
  1908. if (is_type_multi_pointer(src) && is_type_pointer(dst)) {
  1909. lbValue res = {};
  1910. res.type = t;
  1911. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1912. return res;
  1913. }
  1914. if (is_type_pointer(src) && is_type_multi_pointer(dst)) {
  1915. lbValue res = {};
  1916. res.type = t;
  1917. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1918. return res;
  1919. }
  1920. if (is_type_multi_pointer(src) && is_type_multi_pointer(dst)) {
  1921. lbValue res = {};
  1922. res.type = t;
  1923. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1924. return res;
  1925. }
  1926. // proc <-> proc
  1927. if (is_type_proc(src) && is_type_proc(dst)) {
  1928. lbValue res = {};
  1929. res.type = t;
  1930. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1931. return res;
  1932. }
  1933. // pointer -> proc
  1934. if (is_type_pointer(src) && is_type_proc(dst)) {
  1935. lbValue res = {};
  1936. res.type = t;
  1937. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1938. return res;
  1939. }
  1940. // proc -> pointer
  1941. if (is_type_proc(src) && is_type_pointer(dst)) {
  1942. lbValue res = {};
  1943. res.type = t;
  1944. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1945. return res;
  1946. }
  1947. // []byte/[]u8 <-> string
  1948. if (is_type_u8_slice(src) && is_type_string(dst)) {
  1949. return lb_emit_transmute(p, value, t);
  1950. }
  1951. if (is_type_string(src) && is_type_u8_slice(dst)) {
  1952. return lb_emit_transmute(p, value, t);
  1953. }
  1954. if (is_type_array_like(dst)) {
  1955. Type *elem = base_array_type(dst);
  1956. isize index_count = cast(isize)get_array_type_count(dst);
  1957. isize inlineable = type_size_of(dst) <= build_context.max_simd_align;
  1958. lbValue e = lb_emit_conv(p, value, elem);
  1959. if (inlineable && lb_is_const(e)) {
  1960. lbAddr v = {};
  1961. if (e.value) {
  1962. TEMPORARY_ALLOCATOR_GUARD();
  1963. LLVMValueRef *values = gb_alloc_array(temporary_allocator(), LLVMValueRef, index_count);
  1964. for (isize i = 0; i < index_count; i++) {
  1965. values[i] = e.value;
  1966. }
  1967. lbValue array_const_value = {};
  1968. array_const_value.type = t;
  1969. array_const_value.value = LLVMConstArray(lb_type(m, elem), values, cast(unsigned)index_count);
  1970. v = lb_add_global_generated(m, t, array_const_value);
  1971. } else {
  1972. v = lb_add_global_generated(m, t);
  1973. }
  1974. lb_make_global_private_const(v);
  1975. return lb_addr_load(p, v);
  1976. }
  1977. // NOTE(bill): Doesn't need to be zero because it will be initialized in the loops
  1978. lbAddr v = lb_add_local_generated(p, t, false);
  1979. if (!inlineable) {
  1980. auto loop_data = lb_loop_start(p, index_count, t_int);
  1981. lbValue elem = lb_emit_array_ep(p, v.addr, loop_data.idx);
  1982. lb_emit_store(p, elem, e);
  1983. lb_loop_end(p, loop_data);
  1984. } else {
  1985. for (isize i = 0; i < index_count; i++) {
  1986. lbValue elem = lb_emit_array_epi(p, v.addr, i);
  1987. lb_emit_store(p, elem, e);
  1988. }
  1989. }
  1990. return lb_addr_load(p, v);
  1991. }
  1992. if (is_type_matrix(dst) && !is_type_matrix(src)) {
  1993. GB_ASSERT_MSG(dst->Matrix.row_count == dst->Matrix.column_count, "%s <- %s", type_to_string(dst), type_to_string(src));
  1994. Type *elem = base_array_type(dst);
  1995. lbValue e = lb_emit_conv(p, value, elem);
  1996. lbAddr v = lb_add_local_generated(p, t, false);
  1997. lbValue zero = lb_const_value(p->module, elem, exact_value_i64(0), true);
  1998. for (i64 j = 0; j < dst->Matrix.column_count; j++) {
  1999. for (i64 i = 0; i < dst->Matrix.row_count; i++) {
  2000. lbValue ptr = lb_emit_matrix_epi(p, v.addr, i, j);
  2001. lb_emit_store(p, ptr, i == j ? e : zero);
  2002. }
  2003. }
  2004. return lb_addr_load(p, v);
  2005. }
  2006. if (is_type_matrix(dst) && is_type_matrix(src)) {
  2007. GB_ASSERT(dst->kind == Type_Matrix);
  2008. GB_ASSERT(src->kind == Type_Matrix);
  2009. lbAddr v = lb_add_local_generated(p, t, true);
  2010. if (is_matrix_square(dst) && is_matrix_square(dst)) {
  2011. for (i64 j = 0; j < dst->Matrix.column_count; j++) {
  2012. for (i64 i = 0; i < dst->Matrix.row_count; i++) {
  2013. if (i < src->Matrix.row_count && j < src->Matrix.column_count) {
  2014. lbValue d = lb_emit_matrix_epi(p, v.addr, i, j);
  2015. lbValue s = lb_emit_matrix_ev(p, value, i, j);
  2016. lb_emit_store(p, d, s);
  2017. } else if (i == j) {
  2018. lbValue d = lb_emit_matrix_epi(p, v.addr, i, j);
  2019. lbValue s = lb_const_value(p->module, dst->Matrix.elem, exact_value_i64(1), true);
  2020. lb_emit_store(p, d, s);
  2021. }
  2022. }
  2023. }
  2024. } else {
  2025. i64 dst_count = dst->Matrix.row_count*dst->Matrix.column_count;
  2026. i64 src_count = src->Matrix.row_count*src->Matrix.column_count;
  2027. GB_ASSERT(dst_count == src_count);
  2028. lbValue pdst = v.addr;
  2029. lbValue psrc = lb_address_from_load_or_generate_local(p, value);
  2030. bool same_elem_base_types = are_types_identical(
  2031. base_type(dst->Matrix.elem),
  2032. base_type(src->Matrix.elem)
  2033. );
  2034. if (same_elem_base_types && type_size_of(dst) == type_size_of(src)) {
  2035. lb_mem_copy_overlapping(p, v.addr, psrc, lb_const_int(p->module, t_int, type_size_of(dst)));
  2036. } else {
  2037. for (i64 i = 0; i < src_count; i++) {
  2038. lbValue dp = lb_emit_array_epi(p, v.addr, matrix_column_major_index_to_offset(dst, i));
  2039. lbValue sp = lb_emit_array_epi(p, psrc, matrix_column_major_index_to_offset(src, i));
  2040. lbValue s = lb_emit_load(p, sp);
  2041. s = lb_emit_conv(p, s, dst->Matrix.elem);
  2042. lb_emit_store(p, dp, s);
  2043. }
  2044. }
  2045. }
  2046. return lb_addr_load(p, v);
  2047. }
  2048. if (is_type_any(dst)) {
  2049. if (is_type_untyped_uninit(src)) {
  2050. return lb_const_undef(p->module, t);
  2051. }
  2052. if (is_type_untyped_nil(src)) {
  2053. return lb_const_nil(p->module, t);
  2054. }
  2055. lbAddr result = lb_add_local_generated(p, t, true);
  2056. Type *st = default_type(src_type);
  2057. lbValue data = lb_address_from_load_or_generate_local(p, value);
  2058. GB_ASSERT_MSG(is_type_pointer(data.type), "%s", type_to_string(data.type));
  2059. GB_ASSERT_MSG(is_type_typed(st), "%s", type_to_string(st));
  2060. data = lb_emit_conv(p, data, t_rawptr);
  2061. lbValue id = lb_typeid(p->module, st);
  2062. lbValue any_data = lb_emit_struct_ep(p, result.addr, 0);
  2063. lbValue any_id = lb_emit_struct_ep(p, result.addr, 1);
  2064. lb_emit_store(p, any_data, data);
  2065. lb_emit_store(p, any_id, id);
  2066. return lb_addr_load(p, result);
  2067. }
  2068. i64 src_sz = type_size_of(src);
  2069. i64 dst_sz = type_size_of(dst);
  2070. if (src_sz == dst_sz) {
  2071. // bit_set <-> integer
  2072. if (is_type_integer(src) && is_type_bit_set(dst)) {
  2073. lbValue res = lb_emit_conv(p, value, bit_set_to_int(dst));
  2074. res.type = t;
  2075. return res;
  2076. }
  2077. if (is_type_bit_set(src) && is_type_integer(dst)) {
  2078. lbValue bs = value;
  2079. bs.type = bit_set_to_int(src);
  2080. return lb_emit_conv(p, bs, dst);
  2081. }
  2082. // typeid <-> integer
  2083. if (is_type_integer(src) && is_type_typeid(dst)) {
  2084. return lb_emit_transmute(p, value, dst);
  2085. }
  2086. if (is_type_typeid(src) && is_type_integer(dst)) {
  2087. return lb_emit_transmute(p, value, dst);
  2088. }
  2089. }
  2090. if (is_type_untyped(src)) {
  2091. if (is_type_string(src) && is_type_string(dst)) {
  2092. lbAddr result = lb_add_local_generated(p, t, false);
  2093. lb_addr_store(p, result, value);
  2094. return lb_addr_load(p, result);
  2095. }
  2096. }
  2097. gb_printf_err("%.*s\n", LIT(p->name));
  2098. gb_printf_err("lb_emit_conv: src -> dst\n");
  2099. gb_printf_err("Not Identical %s != %s\n", type_to_string(src_type), type_to_string(t));
  2100. gb_printf_err("Not Identical %s != %s\n", type_to_string(src), type_to_string(dst));
  2101. gb_printf_err("Not Identical %p != %p\n", src_type, t);
  2102. gb_printf_err("Not Identical %p != %p\n", src, dst);
  2103. GB_PANIC("Invalid type conversion: '%s' to '%s' for procedure '%.*s'",
  2104. type_to_string(src_type), type_to_string(t),
  2105. LIT(p->name));
  2106. return {};
  2107. }
  2108. gb_internal lbValue lb_emit_c_vararg(lbProcedure *p, lbValue arg, Type *type) {
  2109. Type *core = core_type(type);
  2110. if (core->kind == Type_BitSet) {
  2111. core = core_type(bit_set_to_int(core));
  2112. arg = lb_emit_transmute(p, arg, core);
  2113. }
  2114. Type *promoted = c_vararg_promote_type(core);
  2115. return lb_emit_conv(p, arg, promoted);
  2116. }
  2117. gb_internal lbValue lb_compare_records(lbProcedure *p, TokenKind op_kind, lbValue left, lbValue right, Type *type) {
  2118. GB_ASSERT((is_type_struct(type) || is_type_union(type)) && is_type_comparable(type));
  2119. lbValue left_ptr = lb_address_from_load_or_generate_local(p, left);
  2120. lbValue right_ptr = lb_address_from_load_or_generate_local(p, right);
  2121. lbValue res = {};
  2122. if (type_size_of(type) == 0) {
  2123. switch (op_kind) {
  2124. case Token_CmpEq:
  2125. return lb_const_bool(p->module, t_bool, true);
  2126. case Token_NotEq:
  2127. return lb_const_bool(p->module, t_bool, false);
  2128. }
  2129. GB_PANIC("invalid operator");
  2130. }
  2131. TEMPORARY_ALLOCATOR_GUARD();
  2132. if (is_type_simple_compare(type)) {
  2133. // TODO(bill): Test to see if this is actually faster!!!!
  2134. auto args = array_make<lbValue>(temporary_allocator(), 3);
  2135. args[0] = lb_emit_conv(p, left_ptr, t_rawptr);
  2136. args[1] = lb_emit_conv(p, right_ptr, t_rawptr);
  2137. args[2] = lb_const_int(p->module, t_int, type_size_of(type));
  2138. res = lb_emit_runtime_call(p, "memory_equal", args);
  2139. } else {
  2140. lbValue value = lb_equal_proc_for_type(p->module, type);
  2141. auto args = array_make<lbValue>(temporary_allocator(), 2);
  2142. args[0] = lb_emit_conv(p, left_ptr, t_rawptr);
  2143. args[1] = lb_emit_conv(p, right_ptr, t_rawptr);
  2144. res = lb_emit_call(p, value, args);
  2145. }
  2146. if (op_kind == Token_NotEq) {
  2147. res = lb_emit_unary_arith(p, Token_Not, res, res.type);
  2148. }
  2149. return res;
  2150. }
  2151. gb_internal lbValue lb_emit_comp(lbProcedure *p, TokenKind op_kind, lbValue left, lbValue right) {
  2152. Type *a = core_type(left.type);
  2153. Type *b = core_type(right.type);
  2154. GB_ASSERT(gb_is_between(op_kind, Token__ComparisonBegin+1, Token__ComparisonEnd-1));
  2155. lbValue nil_check = {};
  2156. if (is_type_array_like(left.type) || is_type_array_like(right.type)) {
  2157. // don't do `nil` check if it is array-like
  2158. } else if (is_type_untyped_nil(left.type)) {
  2159. nil_check = lb_emit_comp_against_nil(p, op_kind, right);
  2160. } else if (is_type_untyped_nil(right.type)) {
  2161. nil_check = lb_emit_comp_against_nil(p, op_kind, left);
  2162. }
  2163. if (nil_check.value != nullptr) {
  2164. return nil_check;
  2165. }
  2166. if (are_types_identical(a, b)) {
  2167. // NOTE(bill): No need for a conversion
  2168. } else if ((lb_is_const(left) && !is_type_array(left.type)) || lb_is_const_nil(left)) {
  2169. // NOTE(karl): !is_type_array(left.type) is there to avoid lb_emit_conv
  2170. // trying to convert a constant array into a non-array. In that case we
  2171. // want the `else` branch to happen, so it can try to convert the
  2172. // non-array into an array instead.
  2173. if (lb_is_const_nil(left)) {
  2174. if (internal_check_is_assignable_to(right.type, left.type)) {
  2175. right = lb_emit_conv(p, right, left.type);
  2176. }
  2177. return lb_emit_comp_against_nil(p, op_kind, right);
  2178. }
  2179. left = lb_emit_conv(p, left, right.type);
  2180. } else if ((lb_is_const(right) && !is_type_array(right.type)) || lb_is_const_nil(right)) {
  2181. if (lb_is_const_nil(right)) {
  2182. if (internal_check_is_assignable_to(left.type, right.type)) {
  2183. left = lb_emit_conv(p, left, right.type);
  2184. }
  2185. return lb_emit_comp_against_nil(p, op_kind, left);
  2186. }
  2187. right = lb_emit_conv(p, right, left.type);
  2188. } else {
  2189. Type *lt = left.type;
  2190. Type *rt = right.type;
  2191. lt = left.type;
  2192. rt = right.type;
  2193. i64 ls = type_size_of(lt);
  2194. i64 rs = type_size_of(rt);
  2195. // NOTE(bill): Quick heuristic, larger types are usually the target type
  2196. if (ls < rs) {
  2197. left = lb_emit_conv(p, left, rt);
  2198. } else if (ls > rs) {
  2199. right = lb_emit_conv(p, right, lt);
  2200. } else {
  2201. if (is_type_union(rt)) {
  2202. left = lb_emit_conv(p, left, rt);
  2203. } else {
  2204. right = lb_emit_conv(p, right, lt);
  2205. }
  2206. }
  2207. }
  2208. a = core_type(left.type);
  2209. b = core_type(right.type);
  2210. if (is_type_matrix(a) && (op_kind == Token_CmpEq || op_kind == Token_NotEq)) {
  2211. Type *tl = base_type(a);
  2212. lbValue lhs = lb_address_from_load_or_generate_local(p, left);
  2213. lbValue rhs = lb_address_from_load_or_generate_local(p, right);
  2214. // TODO(bill): Test to see if this is actually faster!!!!
  2215. auto args = array_make<lbValue>(permanent_allocator(), 3);
  2216. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2217. args[1] = lb_emit_conv(p, rhs, t_rawptr);
  2218. args[2] = lb_const_int(p->module, t_int, type_size_of(tl));
  2219. lbValue val = lb_emit_runtime_call(p, "memory_compare", args);
  2220. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_nil(p->module, val.type));
  2221. return lb_emit_conv(p, res, t_bool);
  2222. }
  2223. if (is_type_array_like(a)) {
  2224. Type *tl = base_type(a);
  2225. lbValue lhs = lb_address_from_load_or_generate_local(p, left);
  2226. lbValue rhs = lb_address_from_load_or_generate_local(p, right);
  2227. TokenKind cmp_op = Token_And;
  2228. lbValue res = lb_const_bool(p->module, t_llvm_bool, true);
  2229. if (op_kind == Token_NotEq) {
  2230. res = lb_const_bool(p->module, t_llvm_bool, false);
  2231. cmp_op = Token_Or;
  2232. } else if (op_kind == Token_CmpEq) {
  2233. res = lb_const_bool(p->module, t_llvm_bool, true);
  2234. cmp_op = Token_And;
  2235. }
  2236. bool inline_array_arith = lb_can_try_to_inline_array_arith(tl);
  2237. i32 count = 0;
  2238. switch (tl->kind) {
  2239. case Type_Array: count = cast(i32)tl->Array.count; break;
  2240. case Type_EnumeratedArray: count = cast(i32)tl->EnumeratedArray.count; break;
  2241. }
  2242. if (inline_array_arith) {
  2243. // inline
  2244. lbAddr val = lb_add_local_generated(p, t_bool, false);
  2245. lb_addr_store(p, val, res);
  2246. for (i32 i = 0; i < count; i++) {
  2247. lbValue x = lb_emit_load(p, lb_emit_array_epi(p, lhs, i));
  2248. lbValue y = lb_emit_load(p, lb_emit_array_epi(p, rhs, i));
  2249. lbValue cmp = lb_emit_comp(p, op_kind, x, y);
  2250. lbValue new_res = lb_emit_arith(p, cmp_op, lb_addr_load(p, val), cmp, t_bool);
  2251. lb_addr_store(p, val, lb_emit_conv(p, new_res, t_bool));
  2252. }
  2253. return lb_addr_load(p, val);
  2254. } else {
  2255. if (is_type_simple_compare(tl) && (op_kind == Token_CmpEq || op_kind == Token_NotEq)) {
  2256. // TODO(bill): Test to see if this is actually faster!!!!
  2257. auto args = array_make<lbValue>(permanent_allocator(), 3);
  2258. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2259. args[1] = lb_emit_conv(p, rhs, t_rawptr);
  2260. args[2] = lb_const_int(p->module, t_int, type_size_of(tl));
  2261. lbValue val = lb_emit_runtime_call(p, "memory_compare", args);
  2262. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_nil(p->module, val.type));
  2263. return lb_emit_conv(p, res, t_bool);
  2264. } else {
  2265. lbAddr val = lb_add_local_generated(p, t_bool, false);
  2266. lb_addr_store(p, val, res);
  2267. auto loop_data = lb_loop_start(p, count, t_i32);
  2268. {
  2269. lbValue i = loop_data.idx;
  2270. lbValue x = lb_emit_load(p, lb_emit_array_ep(p, lhs, i));
  2271. lbValue y = lb_emit_load(p, lb_emit_array_ep(p, rhs, i));
  2272. lbValue cmp = lb_emit_comp(p, op_kind, x, y);
  2273. lbValue new_res = lb_emit_arith(p, cmp_op, lb_addr_load(p, val), cmp, t_bool);
  2274. lb_addr_store(p, val, lb_emit_conv(p, new_res, t_bool));
  2275. }
  2276. lb_loop_end(p, loop_data);
  2277. return lb_addr_load(p, val);
  2278. }
  2279. }
  2280. }
  2281. if ((is_type_struct(a) || is_type_union(a)) && is_type_comparable(a)) {
  2282. return lb_compare_records(p, op_kind, left, right, a);
  2283. }
  2284. if ((is_type_struct(b) || is_type_union(b)) && is_type_comparable(b)) {
  2285. return lb_compare_records(p, op_kind, left, right, b);
  2286. }
  2287. if (is_type_string(a)) {
  2288. if (is_type_cstring(a) && is_type_cstring(b)) {
  2289. left = lb_emit_conv(p, left, t_cstring);
  2290. right = lb_emit_conv(p, right, t_cstring);
  2291. char const *runtime_procedure = nullptr;
  2292. switch (op_kind) {
  2293. case Token_CmpEq: runtime_procedure = "cstring_eq"; break;
  2294. case Token_NotEq: runtime_procedure = "cstring_ne"; break;
  2295. case Token_Lt: runtime_procedure = "cstring_lt"; break;
  2296. case Token_Gt: runtime_procedure = "cstring_gt"; break;
  2297. case Token_LtEq: runtime_procedure = "cstring_le"; break;
  2298. case Token_GtEq: runtime_procedure = "cstring_ge"; break;
  2299. }
  2300. GB_ASSERT(runtime_procedure != nullptr);
  2301. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2302. args[0] = left;
  2303. args[1] = right;
  2304. return lb_emit_runtime_call(p, runtime_procedure, args);
  2305. }
  2306. if (is_type_cstring(a) ^ is_type_cstring(b)) {
  2307. left = lb_emit_conv(p, left, t_string);
  2308. right = lb_emit_conv(p, right, t_string);
  2309. }
  2310. char const *runtime_procedure = nullptr;
  2311. switch (op_kind) {
  2312. case Token_CmpEq: runtime_procedure = "string_eq"; break;
  2313. case Token_NotEq: runtime_procedure = "string_ne"; break;
  2314. case Token_Lt: runtime_procedure = "string_lt"; break;
  2315. case Token_Gt: runtime_procedure = "string_gt"; break;
  2316. case Token_LtEq: runtime_procedure = "string_le"; break;
  2317. case Token_GtEq: runtime_procedure = "string_ge"; break;
  2318. }
  2319. GB_ASSERT(runtime_procedure != nullptr);
  2320. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2321. args[0] = left;
  2322. args[1] = right;
  2323. return lb_emit_runtime_call(p, runtime_procedure, args);
  2324. }
  2325. if (is_type_complex(a)) {
  2326. char const *runtime_procedure = "";
  2327. i64 sz = 8*type_size_of(a);
  2328. switch (sz) {
  2329. case 32:
  2330. switch (op_kind) {
  2331. case Token_CmpEq: runtime_procedure = "complex32_eq"; break;
  2332. case Token_NotEq: runtime_procedure = "complex32_ne"; break;
  2333. }
  2334. break;
  2335. case 64:
  2336. switch (op_kind) {
  2337. case Token_CmpEq: runtime_procedure = "complex64_eq"; break;
  2338. case Token_NotEq: runtime_procedure = "complex64_ne"; break;
  2339. }
  2340. break;
  2341. case 128:
  2342. switch (op_kind) {
  2343. case Token_CmpEq: runtime_procedure = "complex128_eq"; break;
  2344. case Token_NotEq: runtime_procedure = "complex128_ne"; break;
  2345. }
  2346. break;
  2347. }
  2348. GB_ASSERT(runtime_procedure != nullptr);
  2349. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2350. args[0] = left;
  2351. args[1] = right;
  2352. return lb_emit_runtime_call(p, runtime_procedure, args);
  2353. }
  2354. if (is_type_quaternion(a)) {
  2355. char const *runtime_procedure = "";
  2356. i64 sz = 8*type_size_of(a);
  2357. switch (sz) {
  2358. case 64:
  2359. switch (op_kind) {
  2360. case Token_CmpEq: runtime_procedure = "quaternion64_eq"; break;
  2361. case Token_NotEq: runtime_procedure = "quaternion64_ne"; break;
  2362. }
  2363. break;
  2364. case 128:
  2365. switch (op_kind) {
  2366. case Token_CmpEq: runtime_procedure = "quaternion128_eq"; break;
  2367. case Token_NotEq: runtime_procedure = "quaternion128_ne"; break;
  2368. }
  2369. break;
  2370. case 256:
  2371. switch (op_kind) {
  2372. case Token_CmpEq: runtime_procedure = "quaternion256_eq"; break;
  2373. case Token_NotEq: runtime_procedure = "quaternion256_ne"; break;
  2374. }
  2375. break;
  2376. }
  2377. GB_ASSERT(runtime_procedure != nullptr);
  2378. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2379. args[0] = left;
  2380. args[1] = right;
  2381. return lb_emit_runtime_call(p, runtime_procedure, args);
  2382. }
  2383. if (is_type_bit_set(a)) {
  2384. switch (op_kind) {
  2385. case Token_Lt:
  2386. case Token_LtEq:
  2387. case Token_Gt:
  2388. case Token_GtEq:
  2389. {
  2390. Type *it = bit_set_to_int(a);
  2391. lbValue lhs = lb_emit_transmute(p, left, it);
  2392. lbValue rhs = lb_emit_transmute(p, right, it);
  2393. lbValue res = lb_emit_arith(p, Token_And, lhs, rhs, it);
  2394. if (op_kind == Token_Lt || op_kind == Token_LtEq) {
  2395. // (lhs & rhs) == lhs
  2396. res.value = LLVMBuildICmp(p->builder, LLVMIntEQ, res.value, lhs.value, "");
  2397. res.type = t_llvm_bool;
  2398. } else if (op_kind == Token_Gt || op_kind == Token_GtEq) {
  2399. // (lhs & rhs) == rhs
  2400. res.value = LLVMBuildICmp(p->builder, LLVMIntEQ, res.value, rhs.value, "");
  2401. res.type = t_llvm_bool;
  2402. }
  2403. // NOTE(bill): Strict subsets
  2404. if (op_kind == Token_Lt || op_kind == Token_Gt) {
  2405. // res &~ (lhs == rhs)
  2406. lbValue eq = {};
  2407. eq.value = LLVMBuildICmp(p->builder, LLVMIntEQ, lhs.value, rhs.value, "");
  2408. eq.type = t_llvm_bool;
  2409. res = lb_emit_arith(p, Token_AndNot, res, eq, t_llvm_bool);
  2410. }
  2411. return res;
  2412. }
  2413. case Token_CmpEq:
  2414. case Token_NotEq:
  2415. {
  2416. LLVMIntPredicate pred = {};
  2417. switch (op_kind) {
  2418. case Token_CmpEq: pred = LLVMIntEQ; break;
  2419. case Token_NotEq: pred = LLVMIntNE; break;
  2420. }
  2421. lbValue res = {};
  2422. res.type = t_llvm_bool;
  2423. res.value = LLVMBuildICmp(p->builder, pred, left.value, right.value, "");
  2424. return res;
  2425. }
  2426. }
  2427. }
  2428. if (op_kind != Token_CmpEq && op_kind != Token_NotEq) {
  2429. Type *t = left.type;
  2430. if (is_type_integer(t) && is_type_different_to_arch_endianness(t)) {
  2431. Type *platform_type = integer_endian_type_to_platform_type(t);
  2432. lbValue x = lb_emit_byte_swap(p, left, platform_type);
  2433. lbValue y = lb_emit_byte_swap(p, right, platform_type);
  2434. left = x;
  2435. right = y;
  2436. } else if (is_type_float(t) && is_type_different_to_arch_endianness(t)) {
  2437. Type *platform_type = integer_endian_type_to_platform_type(t);
  2438. lbValue x = lb_emit_conv(p, left, platform_type);
  2439. lbValue y = lb_emit_conv(p, right, platform_type);
  2440. left = x;
  2441. right = y;
  2442. }
  2443. }
  2444. a = core_type(left.type);
  2445. b = core_type(right.type);
  2446. lbValue res = {};
  2447. res.type = t_llvm_bool;
  2448. if (is_type_integer(a) ||
  2449. is_type_boolean(a) ||
  2450. is_type_pointer(a) ||
  2451. is_type_multi_pointer(a) ||
  2452. is_type_proc(a) ||
  2453. is_type_enum(a)) {
  2454. LLVMIntPredicate pred = {};
  2455. if (is_type_unsigned(left.type)) {
  2456. switch (op_kind) {
  2457. case Token_Gt: pred = LLVMIntUGT; break;
  2458. case Token_GtEq: pred = LLVMIntUGE; break;
  2459. case Token_Lt: pred = LLVMIntULT; break;
  2460. case Token_LtEq: pred = LLVMIntULE; break;
  2461. }
  2462. } else {
  2463. switch (op_kind) {
  2464. case Token_Gt: pred = LLVMIntSGT; break;
  2465. case Token_GtEq: pred = LLVMIntSGE; break;
  2466. case Token_Lt: pred = LLVMIntSLT; break;
  2467. case Token_LtEq: pred = LLVMIntSLE; break;
  2468. }
  2469. }
  2470. switch (op_kind) {
  2471. case Token_CmpEq: pred = LLVMIntEQ; break;
  2472. case Token_NotEq: pred = LLVMIntNE; break;
  2473. }
  2474. LLVMValueRef lhs = left.value;
  2475. LLVMValueRef rhs = right.value;
  2476. if (LLVMTypeOf(lhs) != LLVMTypeOf(rhs)) {
  2477. if (lb_is_type_kind(LLVMTypeOf(lhs), LLVMPointerTypeKind)) {
  2478. rhs = LLVMBuildPointerCast(p->builder, rhs, LLVMTypeOf(lhs), "");
  2479. }
  2480. }
  2481. res.value = LLVMBuildICmp(p->builder, pred, lhs, rhs, "");
  2482. } else if (is_type_float(a)) {
  2483. LLVMRealPredicate pred = {};
  2484. switch (op_kind) {
  2485. case Token_CmpEq: pred = LLVMRealOEQ; break;
  2486. case Token_Gt: pred = LLVMRealOGT; break;
  2487. case Token_GtEq: pred = LLVMRealOGE; break;
  2488. case Token_Lt: pred = LLVMRealOLT; break;
  2489. case Token_LtEq: pred = LLVMRealOLE; break;
  2490. case Token_NotEq: pred = LLVMRealONE; break;
  2491. }
  2492. res.value = LLVMBuildFCmp(p->builder, pred, left.value, right.value, "");
  2493. } else if (is_type_typeid(a)) {
  2494. LLVMIntPredicate pred = {};
  2495. switch (op_kind) {
  2496. case Token_Gt: pred = LLVMIntUGT; break;
  2497. case Token_GtEq: pred = LLVMIntUGE; break;
  2498. case Token_Lt: pred = LLVMIntULT; break;
  2499. case Token_LtEq: pred = LLVMIntULE; break;
  2500. case Token_CmpEq: pred = LLVMIntEQ; break;
  2501. case Token_NotEq: pred = LLVMIntNE; break;
  2502. }
  2503. res.value = LLVMBuildICmp(p->builder, pred, left.value, right.value, "");
  2504. } else if (is_type_simd_vector(a)) {
  2505. LLVMValueRef mask = nullptr;
  2506. Type *elem = base_array_type(a);
  2507. if (is_type_float(elem)) {
  2508. LLVMRealPredicate pred = {};
  2509. switch (op_kind) {
  2510. case Token_CmpEq: pred = LLVMRealOEQ; break;
  2511. case Token_NotEq: pred = LLVMRealONE; break;
  2512. }
  2513. mask = LLVMBuildFCmp(p->builder, pred, left.value, right.value, "");
  2514. } else {
  2515. LLVMIntPredicate pred = {};
  2516. switch (op_kind) {
  2517. case Token_CmpEq: pred = LLVMIntEQ; break;
  2518. case Token_NotEq: pred = LLVMIntNE; break;
  2519. }
  2520. mask = LLVMBuildICmp(p->builder, pred, left.value, right.value, "");
  2521. }
  2522. GB_ASSERT_MSG(mask != nullptr, "Unhandled comparison kind %s (%s) %.*s %s (%s)", type_to_string(left.type), type_to_string(base_type(left.type)), LIT(token_strings[op_kind]), type_to_string(right.type), type_to_string(base_type(right.type)));
  2523. /* NOTE(bill, 2022-05-28):
  2524. Thanks to Per Vognsen, sign extending <N x i1> to
  2525. a vector of the same width as the input vector, bit casting to an integer,
  2526. and then comparing against zero is the better option
  2527. See: https://lists.llvm.org/pipermail/llvm-dev/2012-September/053046.html
  2528. // Example assuming 128-bit vector
  2529. %1 = <4 x float> ...
  2530. %2 = <4 x float> ...
  2531. %3 = fcmp oeq <4 x float> %1, %2
  2532. %4 = sext <4 x i1> %3 to <4 x i32>
  2533. %5 = bitcast <4 x i32> %4 to i128
  2534. %6 = icmp ne i128 %5, 0
  2535. br i1 %6, label %true1, label %false2
  2536. This will result in 1 cmpps + 1 ptest + 1 br
  2537. (even without SSE4.1, contrary to what the mail list states, because of pmovmskb)
  2538. */
  2539. unsigned count = cast(unsigned)get_array_type_count(a);
  2540. unsigned elem_sz = cast(unsigned)(type_size_of(elem)*8);
  2541. LLVMTypeRef mask_type = LLVMVectorType(LLVMIntTypeInContext(p->module->ctx, elem_sz), count);
  2542. mask = LLVMBuildSExtOrBitCast(p->builder, mask, mask_type, "");
  2543. LLVMTypeRef mask_int_type = LLVMIntTypeInContext(p->module->ctx, cast(unsigned)(8*type_size_of(a)));
  2544. LLVMValueRef mask_int = LLVMBuildBitCast(p->builder, mask, mask_int_type, "");
  2545. res.value = LLVMBuildICmp(p->builder, LLVMIntNE, mask_int, LLVMConstNull(LLVMTypeOf(mask_int)), "");
  2546. return res;
  2547. } else {
  2548. GB_PANIC("Unhandled comparison kind %s (%s) %.*s %s (%s)", type_to_string(left.type), type_to_string(base_type(left.type)), LIT(token_strings[op_kind]), type_to_string(right.type), type_to_string(base_type(right.type)));
  2549. }
  2550. return res;
  2551. }
  2552. gb_internal lbValue lb_emit_comp_against_nil(lbProcedure *p, TokenKind op_kind, lbValue x) {
  2553. lbValue res = {};
  2554. res.type = t_llvm_bool;
  2555. Type *t = x.type;
  2556. Type *bt = base_type(t);
  2557. TypeKind type_kind = bt->kind;
  2558. switch (type_kind) {
  2559. case Type_Basic:
  2560. switch (bt->Basic.kind) {
  2561. case Basic_rawptr:
  2562. case Basic_cstring:
  2563. if (op_kind == Token_CmpEq) {
  2564. res.value = LLVMBuildIsNull(p->builder, x.value, "");
  2565. } else if (op_kind == Token_NotEq) {
  2566. res.value = LLVMBuildIsNotNull(p->builder, x.value, "");
  2567. }
  2568. return res;
  2569. case Basic_any:
  2570. {
  2571. // TODO(bill): is this correct behaviour for nil comparison for any?
  2572. lbValue data = lb_emit_struct_ev(p, x, 0);
  2573. lbValue ti = lb_emit_struct_ev(p, x, 1);
  2574. if (op_kind == Token_CmpEq) {
  2575. LLVMValueRef a = LLVMBuildIsNull(p->builder, data.value, "");
  2576. LLVMValueRef b = LLVMBuildIsNull(p->builder, ti.value, "");
  2577. res.value = LLVMBuildOr(p->builder, a, b, "");
  2578. return res;
  2579. } else if (op_kind == Token_NotEq) {
  2580. LLVMValueRef a = LLVMBuildIsNotNull(p->builder, data.value, "");
  2581. LLVMValueRef b = LLVMBuildIsNotNull(p->builder, ti.value, "");
  2582. res.value = LLVMBuildAnd(p->builder, a, b, "");
  2583. return res;
  2584. }
  2585. }
  2586. break;
  2587. case Basic_typeid:
  2588. lbValue invalid_typeid = lb_const_value(p->module, t_typeid, exact_value_i64(0));
  2589. return lb_emit_comp(p, op_kind, x, invalid_typeid);
  2590. }
  2591. break;
  2592. case Type_Enum:
  2593. case Type_Pointer:
  2594. case Type_MultiPointer:
  2595. case Type_Proc:
  2596. if (op_kind == Token_CmpEq) {
  2597. res.value = LLVMBuildIsNull(p->builder, x.value, "");
  2598. } else if (op_kind == Token_NotEq) {
  2599. res.value = LLVMBuildIsNotNull(p->builder, x.value, "");
  2600. }
  2601. return res;
  2602. case Type_BitSet:
  2603. {
  2604. Type *u = bit_set_to_int(bt);
  2605. if (is_type_array(u)) {
  2606. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2607. lbValue lhs = lb_address_from_load_or_generate_local(p, x);
  2608. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2609. args[1] = lb_const_int(p->module, t_int, type_size_of(t));
  2610. lbValue val = lb_emit_runtime_call(p, "memory_compare_zero", args);
  2611. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_int(p->module, t_int, 0));
  2612. return res;
  2613. } else {
  2614. if (op_kind == Token_CmpEq) {
  2615. res.value = LLVMBuildIsNull(p->builder, x.value, "");
  2616. } else if (op_kind == Token_NotEq) {
  2617. res.value = LLVMBuildIsNotNull(p->builder, x.value, "");
  2618. }
  2619. }
  2620. return res;
  2621. }
  2622. case Type_Slice:
  2623. {
  2624. lbValue data = lb_emit_struct_ev(p, x, 0);
  2625. if (op_kind == Token_CmpEq) {
  2626. res.value = LLVMBuildIsNull(p->builder, data.value, "");
  2627. return res;
  2628. } else if (op_kind == Token_NotEq) {
  2629. res.value = LLVMBuildIsNotNull(p->builder, data.value, "");
  2630. return res;
  2631. }
  2632. }
  2633. break;
  2634. case Type_DynamicArray:
  2635. {
  2636. lbValue data = lb_emit_struct_ev(p, x, 0);
  2637. if (op_kind == Token_CmpEq) {
  2638. res.value = LLVMBuildIsNull(p->builder, data.value, "");
  2639. return res;
  2640. } else if (op_kind == Token_NotEq) {
  2641. res.value = LLVMBuildIsNotNull(p->builder, data.value, "");
  2642. return res;
  2643. }
  2644. }
  2645. break;
  2646. case Type_Map:
  2647. {
  2648. lbValue data_ptr = lb_emit_struct_ev(p, x, 0);
  2649. if (op_kind == Token_CmpEq) {
  2650. res.value = LLVMBuildIsNull(p->builder, data_ptr.value, "");
  2651. return res;
  2652. } else {
  2653. res.value = LLVMBuildIsNotNull(p->builder, data_ptr.value, "");
  2654. return res;
  2655. }
  2656. }
  2657. break;
  2658. case Type_Union:
  2659. {
  2660. if (type_size_of(t) == 0) {
  2661. if (op_kind == Token_CmpEq) {
  2662. return lb_const_bool(p->module, t_llvm_bool, true);
  2663. } else if (op_kind == Token_NotEq) {
  2664. return lb_const_bool(p->module, t_llvm_bool, false);
  2665. }
  2666. } else if (is_type_union_maybe_pointer(t)) {
  2667. lbValue tag = lb_emit_transmute(p, x, t_rawptr);
  2668. return lb_emit_comp_against_nil(p, op_kind, tag);
  2669. } else {
  2670. lbValue tag = lb_emit_union_tag_value(p, x);
  2671. return lb_emit_comp(p, op_kind, tag, lb_zero(p->module, tag.type));
  2672. }
  2673. }
  2674. case Type_Struct:
  2675. if (is_type_soa_struct(t)) {
  2676. Type *bt = base_type(t);
  2677. if (bt->Struct.soa_kind == StructSoa_Slice) {
  2678. LLVMValueRef the_value = {};
  2679. if (bt->Struct.fields.count == 0) {
  2680. lbValue len = lb_soa_struct_len(p, x);
  2681. the_value = len.value;
  2682. } else {
  2683. lbValue first_field = lb_emit_struct_ev(p, x, 0);
  2684. the_value = first_field.value;
  2685. }
  2686. if (op_kind == Token_CmpEq) {
  2687. res.value = LLVMBuildIsNull(p->builder, the_value, "");
  2688. return res;
  2689. } else if (op_kind == Token_NotEq) {
  2690. res.value = LLVMBuildIsNotNull(p->builder, the_value, "");
  2691. return res;
  2692. }
  2693. } else if (bt->Struct.soa_kind == StructSoa_Dynamic) {
  2694. LLVMValueRef the_value = {};
  2695. if (bt->Struct.fields.count == 0) {
  2696. lbValue cap = lb_soa_struct_cap(p, x);
  2697. the_value = cap.value;
  2698. } else {
  2699. lbValue first_field = lb_emit_struct_ev(p, x, 0);
  2700. the_value = first_field.value;
  2701. }
  2702. if (op_kind == Token_CmpEq) {
  2703. res.value = LLVMBuildIsNull(p->builder, the_value, "");
  2704. return res;
  2705. } else if (op_kind == Token_NotEq) {
  2706. res.value = LLVMBuildIsNotNull(p->builder, the_value, "");
  2707. return res;
  2708. }
  2709. }
  2710. } else if (is_type_struct(t) && type_has_nil(t)) {
  2711. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2712. lbValue lhs = lb_address_from_load_or_generate_local(p, x);
  2713. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2714. args[1] = lb_const_int(p->module, t_int, type_size_of(t));
  2715. lbValue val = lb_emit_runtime_call(p, "memory_compare_zero", args);
  2716. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_int(p->module, t_int, 0));
  2717. return res;
  2718. }
  2719. break;
  2720. }
  2721. GB_PANIC("Unknown handled type: %s -> %s", type_to_string(t), type_to_string(bt));
  2722. return {};
  2723. }
  2724. gb_internal lbValue lb_build_unary_and(lbProcedure *p, Ast *expr) {
  2725. ast_node(ue, UnaryExpr, expr);
  2726. auto tv = type_and_value_of_expr(expr);
  2727. Ast *ue_expr = unparen_expr(ue->expr);
  2728. if (ue_expr->kind == Ast_IndexExpr && tv.mode == Addressing_OptionalOkPtr && is_type_tuple(tv.type)) {
  2729. Type *tuple = tv.type;
  2730. Type *map_type = type_of_expr(ue_expr->IndexExpr.expr);
  2731. Type *ot = base_type(map_type);
  2732. Type *t = base_type(type_deref(ot));
  2733. bool deref = t != ot;
  2734. GB_ASSERT(t->kind == Type_Map);
  2735. ast_node(ie, IndexExpr, ue_expr);
  2736. lbValue map_val = lb_build_addr_ptr(p, ie->expr);
  2737. if (deref) {
  2738. map_val = lb_emit_load(p, map_val);
  2739. }
  2740. lbValue key = lb_build_expr(p, ie->index);
  2741. key = lb_emit_conv(p, key, t->Map.key);
  2742. lbAddr addr = lb_addr_map(map_val, key, t, alloc_type_pointer(t->Map.value));
  2743. lbValue ptr = lb_addr_get_ptr(p, addr);
  2744. lbValue ok = lb_emit_comp_against_nil(p, Token_NotEq, ptr);
  2745. ok = lb_emit_conv(p, ok, tuple->Tuple.variables[1]->type);
  2746. lbAddr res = lb_add_local_generated(p, tuple, false);
  2747. lbValue gep0 = lb_emit_struct_ep(p, res.addr, 0);
  2748. lbValue gep1 = lb_emit_struct_ep(p, res.addr, 1);
  2749. lb_emit_store(p, gep0, ptr);
  2750. lb_emit_store(p, gep1, ok);
  2751. return lb_addr_load(p, res);
  2752. } else if (is_type_soa_pointer(tv.type)) {
  2753. ast_node(ie, IndexExpr, ue_expr);
  2754. lbValue addr = lb_build_addr_ptr(p, ie->expr);
  2755. if (is_type_pointer(type_deref(addr.type))) {
  2756. addr = lb_emit_load(p, addr);
  2757. }
  2758. GB_ASSERT(is_type_pointer(addr.type));
  2759. lbValue index = lb_build_expr(p, ie->index);
  2760. if (!build_context.no_bounds_check) {
  2761. // TODO(bill): soa bounds checking
  2762. }
  2763. return lb_make_soa_pointer(p, tv.type, addr, index);
  2764. } else if (ue_expr->kind == Ast_CompoundLit) {
  2765. lbValue v = lb_build_expr(p, ue->expr);
  2766. Type *type = v.type;
  2767. lbAddr addr = {};
  2768. if (p->is_startup) {
  2769. addr = lb_add_global_generated(p->module, type, v);
  2770. } else {
  2771. addr = lb_add_local_generated(p, type, false);
  2772. }
  2773. lb_addr_store(p, addr, v);
  2774. return addr.addr;
  2775. } else if (ue_expr->kind == Ast_TypeAssertion) {
  2776. if (is_type_tuple(tv.type)) {
  2777. Type *tuple = tv.type;
  2778. Type *ptr_type = tuple->Tuple.variables[0]->type;
  2779. Type *ok_type = tuple->Tuple.variables[1]->type;
  2780. ast_node(ta, TypeAssertion, ue_expr);
  2781. TokenPos pos = ast_token(expr).pos;
  2782. Type *type = type_of_expr(ue_expr);
  2783. GB_ASSERT(!is_type_tuple(type));
  2784. lbValue e = lb_build_expr(p, ta->expr);
  2785. Type *t = type_deref(e.type);
  2786. if (is_type_union(t)) {
  2787. lbValue v = e;
  2788. if (!is_type_pointer(v.type)) {
  2789. v = lb_address_from_load_or_generate_local(p, v);
  2790. }
  2791. Type *src_type = type_deref(v.type);
  2792. Type *dst_type = type;
  2793. lbValue src_tag = {};
  2794. lbValue dst_tag = {};
  2795. if (is_type_union_maybe_pointer(src_type)) {
  2796. src_tag = lb_emit_comp_against_nil(p, Token_NotEq, v);
  2797. dst_tag = lb_const_bool(p->module, t_bool, true);
  2798. } else {
  2799. src_tag = lb_emit_load(p, lb_emit_union_tag_ptr(p, v));
  2800. dst_tag = lb_const_union_tag(p->module, src_type, dst_type);
  2801. }
  2802. lbValue ok = lb_emit_comp(p, Token_CmpEq, src_tag, dst_tag);
  2803. lbValue data_ptr = lb_emit_conv(p, v, ptr_type);
  2804. lbAddr res = lb_add_local_generated(p, tuple, true);
  2805. lbValue gep0 = lb_emit_struct_ep(p, res.addr, 0);
  2806. lbValue gep1 = lb_emit_struct_ep(p, res.addr, 1);
  2807. lb_emit_store(p, gep0, lb_emit_select(p, ok, data_ptr, lb_const_nil(p->module, ptr_type)));
  2808. lb_emit_store(p, gep1, lb_emit_conv(p, ok, ok_type));
  2809. return lb_addr_load(p, res);
  2810. } else if (is_type_any(t)) {
  2811. lbValue v = e;
  2812. if (is_type_pointer(v.type)) {
  2813. v = lb_emit_load(p, v);
  2814. }
  2815. lbValue data_ptr = lb_emit_conv(p, lb_emit_struct_ev(p, v, 0), ptr_type);
  2816. lbValue any_id = lb_emit_struct_ev(p, v, 1);
  2817. lbValue id = lb_typeid(p->module, type);
  2818. lbValue ok = lb_emit_comp(p, Token_CmpEq, any_id, id);
  2819. lbAddr res = lb_add_local_generated(p, tuple, false);
  2820. lbValue gep0 = lb_emit_struct_ep(p, res.addr, 0);
  2821. lbValue gep1 = lb_emit_struct_ep(p, res.addr, 1);
  2822. lb_emit_store(p, gep0, lb_emit_select(p, ok, data_ptr, lb_const_nil(p->module, ptr_type)));
  2823. lb_emit_store(p, gep1, lb_emit_conv(p, ok, ok_type));
  2824. return lb_addr_load(p, res);
  2825. } else {
  2826. GB_PANIC("TODO(bill): type assertion %s", type_to_string(type));
  2827. }
  2828. } else {
  2829. GB_ASSERT(is_type_pointer(tv.type));
  2830. ast_node(ta, TypeAssertion, ue_expr);
  2831. TokenPos pos = ast_token(expr).pos;
  2832. Type *type = type_of_expr(ue_expr);
  2833. GB_ASSERT(!is_type_tuple(type));
  2834. lbValue e = lb_build_expr(p, ta->expr);
  2835. Type *t = type_deref(e.type);
  2836. if (is_type_union(t)) {
  2837. lbValue v = e;
  2838. if (!is_type_pointer(v.type)) {
  2839. v = lb_address_from_load_or_generate_local(p, v);
  2840. }
  2841. Type *src_type = type_deref(v.type);
  2842. Type *dst_type = type;
  2843. if (!build_context.no_type_assert && (p->state_flags & StateFlag_no_type_assert) == 0) {
  2844. lbValue src_tag = {};
  2845. lbValue dst_tag = {};
  2846. if (is_type_union_maybe_pointer(src_type)) {
  2847. src_tag = lb_emit_comp_against_nil(p, Token_NotEq, v);
  2848. dst_tag = lb_const_bool(p->module, t_bool, true);
  2849. } else {
  2850. src_tag = lb_emit_load(p, lb_emit_union_tag_ptr(p, v));
  2851. dst_tag = lb_const_union_tag(p->module, src_type, dst_type);
  2852. }
  2853. isize arg_count = 6;
  2854. if (build_context.no_rtti) {
  2855. arg_count = 4;
  2856. }
  2857. lbValue ok = lb_emit_comp(p, Token_CmpEq, src_tag, dst_tag);
  2858. auto args = array_make<lbValue>(permanent_allocator(), arg_count);
  2859. args[0] = ok;
  2860. args[1] = lb_find_or_add_entity_string(p->module, get_file_path_string(pos.file_id));
  2861. args[2] = lb_const_int(p->module, t_i32, pos.line);
  2862. args[3] = lb_const_int(p->module, t_i32, pos.column);
  2863. if (!build_context.no_rtti) {
  2864. args[4] = lb_typeid(p->module, src_type);
  2865. args[5] = lb_typeid(p->module, dst_type);
  2866. }
  2867. lb_emit_runtime_call(p, "type_assertion_check", args);
  2868. }
  2869. lbValue data_ptr = v;
  2870. return lb_emit_conv(p, data_ptr, tv.type);
  2871. } else if (is_type_any(t)) {
  2872. lbValue v = e;
  2873. if (is_type_pointer(v.type)) {
  2874. v = lb_emit_load(p, v);
  2875. }
  2876. lbValue data_ptr = lb_emit_struct_ev(p, v, 0);
  2877. if (!build_context.no_type_assert && (p->state_flags & StateFlag_no_type_assert) == 0) {
  2878. GB_ASSERT(!build_context.no_rtti);
  2879. lbValue any_id = lb_emit_struct_ev(p, v, 1);
  2880. lbValue id = lb_typeid(p->module, type);
  2881. lbValue ok = lb_emit_comp(p, Token_CmpEq, any_id, id);
  2882. auto args = array_make<lbValue>(permanent_allocator(), 6);
  2883. args[0] = ok;
  2884. args[1] = lb_find_or_add_entity_string(p->module, get_file_path_string(pos.file_id));
  2885. args[2] = lb_const_int(p->module, t_i32, pos.line);
  2886. args[3] = lb_const_int(p->module, t_i32, pos.column);
  2887. args[4] = any_id;
  2888. args[5] = id;
  2889. lb_emit_runtime_call(p, "type_assertion_check", args);
  2890. }
  2891. return lb_emit_conv(p, data_ptr, tv.type);
  2892. } else {
  2893. GB_PANIC("TODO(bill): type assertion %s", type_to_string(type));
  2894. }
  2895. }
  2896. }
  2897. return lb_build_addr_ptr(p, ue->expr);
  2898. }
  2899. gb_internal lbValue lb_build_expr_internal(lbProcedure *p, Ast *expr);
  2900. gb_internal lbValue lb_build_expr(lbProcedure *p, Ast *expr) {
  2901. u16 prev_state_flags = p->state_flags;
  2902. defer (p->state_flags = prev_state_flags);
  2903. if (expr->state_flags != 0) {
  2904. u16 in = expr->state_flags;
  2905. u16 out = p->state_flags;
  2906. if (in & StateFlag_bounds_check) {
  2907. out |= StateFlag_bounds_check;
  2908. out &= ~StateFlag_no_bounds_check;
  2909. } else if (in & StateFlag_no_bounds_check) {
  2910. out |= StateFlag_no_bounds_check;
  2911. out &= ~StateFlag_bounds_check;
  2912. }
  2913. if (in & StateFlag_type_assert) {
  2914. out |= StateFlag_type_assert;
  2915. out &= ~StateFlag_no_type_assert;
  2916. } else if (in & StateFlag_no_type_assert) {
  2917. out |= StateFlag_no_type_assert;
  2918. out &= ~StateFlag_type_assert;
  2919. }
  2920. p->state_flags = out;
  2921. }
  2922. // IMPORTANT NOTE(bill):
  2923. // Selector Call Expressions (foo->bar(...))
  2924. // must only evaluate `foo` once as it gets transformed into
  2925. // `foo.bar(foo, ...)`
  2926. // And if `foo` is a procedure call or something more complex, storing the value
  2927. // once is a very good idea
  2928. // If a stored value is found, it must be removed from the cache
  2929. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  2930. lbValue *pp = map_get(&p->selector_values, expr);
  2931. if (pp != nullptr) {
  2932. lbValue res = *pp;
  2933. map_remove(&p->selector_values, expr);
  2934. return res;
  2935. }
  2936. lbAddr *pa = map_get(&p->selector_addr, expr);
  2937. if (pa != nullptr) {
  2938. lbAddr res = *pa;
  2939. map_remove(&p->selector_addr, expr);
  2940. return lb_addr_load(p, res);
  2941. }
  2942. }
  2943. lbValue res = lb_build_expr_internal(p, expr);
  2944. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  2945. map_set(&p->selector_values, expr, res);
  2946. }
  2947. return res;
  2948. }
  2949. gb_internal lbValue lb_build_expr_internal(lbProcedure *p, Ast *expr) {
  2950. lbModule *m = p->module;
  2951. expr = unparen_expr(expr);
  2952. TokenPos expr_pos = ast_token(expr).pos;
  2953. TypeAndValue tv = type_and_value_of_expr(expr);
  2954. Type *type = type_of_expr(expr);
  2955. GB_ASSERT_MSG(tv.mode != Addressing_Invalid, "invalid expression '%s' (tv.mode = %d, tv.type = %s) @ %s\n Current Proc: %.*s : %s", expr_to_string(expr), tv.mode, type_to_string(tv.type), token_pos_to_string(expr_pos), LIT(p->name), type_to_string(p->type));
  2956. if (tv.value.kind != ExactValue_Invalid) {
  2957. // NOTE(bill): Short on constant values
  2958. return lb_const_value(p->module, type, tv.value);
  2959. } else if (tv.mode == Addressing_Type) {
  2960. // NOTE(bill, 2023-01-16): is this correct? I hope so at least
  2961. return lb_typeid(m, tv.type);
  2962. }
  2963. switch (expr->kind) {
  2964. case_ast_node(bl, BasicLit, expr);
  2965. if (type != nullptr && type->Named.name == "Error") {
  2966. Entity *e = type->Named.type_name;
  2967. if (e->pkg && e->pkg->name == "os") {
  2968. return lb_const_nil(p->module, type);
  2969. }
  2970. }
  2971. TokenPos pos = bl->token.pos;
  2972. GB_PANIC("Non-constant basic literal %s - %.*s (%s)", token_pos_to_string(pos), LIT(token_strings[bl->token.kind]), type_to_string(type));
  2973. case_end;
  2974. case_ast_node(bd, BasicDirective, expr);
  2975. TokenPos pos = bd->token.pos;
  2976. GB_PANIC("Non-constant basic literal %s - %.*s", token_pos_to_string(pos), LIT(bd->name.string));
  2977. case_end;
  2978. case_ast_node(i, Implicit, expr);
  2979. return lb_addr_load(p, lb_build_addr(p, expr));
  2980. case_end;
  2981. case_ast_node(u, Uninit, expr)
  2982. lbValue res = {};
  2983. if (is_type_untyped(type)) {
  2984. res.value = nullptr;
  2985. res.type = t_untyped_uninit;
  2986. } else {
  2987. res.value = LLVMGetUndef(lb_type(m, type));
  2988. res.type = type;
  2989. }
  2990. return res;
  2991. case_end;
  2992. case_ast_node(i, Ident, expr);
  2993. Entity *e = entity_from_expr(expr);
  2994. e = strip_entity_wrapping(e);
  2995. GB_ASSERT_MSG(e != nullptr, "%s in %.*s %p", expr_to_string(expr), LIT(p->name), expr);
  2996. if (e->kind == Entity_Builtin) {
  2997. Token token = ast_token(expr);
  2998. GB_PANIC("TODO(bill): lb_build_expr Entity_Builtin '%.*s'\n"
  2999. "\t at %s", LIT(builtin_procs[e->Builtin.id].name),
  3000. token_pos_to_string(token.pos));
  3001. return {};
  3002. } else if (e->kind == Entity_Nil) {
  3003. lbValue res = {};
  3004. res.value = nullptr;
  3005. res.type = e->type;
  3006. return res;
  3007. }
  3008. GB_ASSERT(e->kind != Entity_ProcGroup);
  3009. return lb_find_ident(p, m, e, expr);
  3010. case_end;
  3011. case_ast_node(de, DerefExpr, expr);
  3012. return lb_addr_load(p, lb_build_addr(p, expr));
  3013. case_end;
  3014. case_ast_node(se, SelectorExpr, expr);
  3015. TypeAndValue tav = type_and_value_of_expr(expr);
  3016. GB_ASSERT(tav.mode != Addressing_Invalid);
  3017. return lb_addr_load(p, lb_build_addr(p, expr));
  3018. case_end;
  3019. case_ast_node(ise, ImplicitSelectorExpr, expr);
  3020. TypeAndValue tav = type_and_value_of_expr(expr);
  3021. GB_ASSERT(tav.mode == Addressing_Constant);
  3022. return lb_const_value(p->module, type, tv.value);
  3023. case_end;
  3024. case_ast_node(se, SelectorCallExpr, expr);
  3025. GB_ASSERT(se->modified_call);
  3026. return lb_build_call_expr(p, se->call);
  3027. case_end;
  3028. case_ast_node(te, TernaryIfExpr, expr);
  3029. LLVMValueRef incoming_values[2] = {};
  3030. LLVMBasicBlockRef incoming_blocks[2] = {};
  3031. GB_ASSERT(te->y != nullptr);
  3032. lbBlock *then = lb_create_block(p, "if.then");
  3033. lbBlock *done = lb_create_block(p, "if.done"); // NOTE(bill): Append later
  3034. lbBlock *else_ = lb_create_block(p, "if.else");
  3035. lb_build_cond(p, te->cond, then, else_);
  3036. lb_start_block(p, then);
  3037. Type *type = default_type(type_of_expr(expr));
  3038. LLVMTypeRef llvm_type = lb_type(p->module, type);
  3039. incoming_values[0] = lb_emit_conv(p, lb_build_expr(p, te->x), type).value;
  3040. if (is_type_internally_pointer_like(type)) {
  3041. incoming_values[0] = LLVMBuildBitCast(p->builder, incoming_values[0], llvm_type, "");
  3042. }
  3043. lb_emit_jump(p, done);
  3044. lb_start_block(p, else_);
  3045. incoming_values[1] = lb_emit_conv(p, lb_build_expr(p, te->y), type).value;
  3046. if (is_type_internally_pointer_like(type)) {
  3047. incoming_values[1] = LLVMBuildBitCast(p->builder, incoming_values[1], llvm_type, "");
  3048. }
  3049. lb_emit_jump(p, done);
  3050. lb_start_block(p, done);
  3051. lbValue res = {};
  3052. res.value = LLVMBuildPhi(p->builder, llvm_type, "");
  3053. res.type = type;
  3054. GB_ASSERT(p->curr_block->preds.count >= 2);
  3055. incoming_blocks[0] = p->curr_block->preds[0]->block;
  3056. incoming_blocks[1] = p->curr_block->preds[1]->block;
  3057. LLVMAddIncoming(res.value, incoming_values, incoming_blocks, 2);
  3058. return res;
  3059. case_end;
  3060. case_ast_node(te, TernaryWhenExpr, expr);
  3061. TypeAndValue tav = type_and_value_of_expr(te->cond);
  3062. GB_ASSERT(tav.mode == Addressing_Constant);
  3063. GB_ASSERT(tav.value.kind == ExactValue_Bool);
  3064. if (tav.value.value_bool) {
  3065. return lb_build_expr(p, te->x);
  3066. } else {
  3067. return lb_build_expr(p, te->y);
  3068. }
  3069. case_end;
  3070. case_ast_node(oe, OrElseExpr, expr);
  3071. return lb_emit_or_else(p, oe->x, oe->y, tv);
  3072. case_end;
  3073. case_ast_node(oe, OrReturnExpr, expr);
  3074. return lb_emit_or_return(p, oe->expr, tv);
  3075. case_end;
  3076. case_ast_node(be, OrBranchExpr, expr);
  3077. lbBlock *block = nullptr;
  3078. if (be->label != nullptr) {
  3079. lbBranchBlocks bb = lb_lookup_branch_blocks(p, be->label);
  3080. switch (be->token.kind) {
  3081. case Token_or_break: block = bb.break_; break;
  3082. case Token_or_continue: block = bb.continue_; break;
  3083. }
  3084. } else {
  3085. for (lbTargetList *t = p->target_list; t != nullptr && block == nullptr; t = t->prev) {
  3086. if (t->is_block) {
  3087. continue;
  3088. }
  3089. switch (be->token.kind) {
  3090. case Token_or_break: block = t->break_; break;
  3091. case Token_or_continue: block = t->continue_; break;
  3092. }
  3093. }
  3094. }
  3095. GB_ASSERT(block != nullptr);
  3096. lbValue lhs = {};
  3097. lbValue rhs = {};
  3098. lb_emit_try_lhs_rhs(p, be->expr, tv, &lhs, &rhs);
  3099. Type *type = default_type(tv.type);
  3100. if (lhs.value) {
  3101. lhs = lb_emit_conv(p, lhs, type);
  3102. } else if (type != nullptr && type != t_invalid) {
  3103. lhs = lb_const_nil(p->module, type);
  3104. }
  3105. lbBlock *then = lb_create_block(p, "or_branch.then");
  3106. lbBlock *else_ = lb_create_block(p, "or_branch.else");
  3107. lb_emit_if(p, lb_emit_try_has_value(p, rhs), then, else_);
  3108. lb_start_block(p, else_);
  3109. lb_emit_defer_stmts(p, lbDeferExit_Branch, block);
  3110. lb_emit_jump(p, block);
  3111. lb_start_block(p, then);
  3112. return lhs;
  3113. case_end;
  3114. case_ast_node(ta, TypeAssertion, expr);
  3115. TokenPos pos = ast_token(expr).pos;
  3116. lbValue e = lb_build_expr(p, ta->expr);
  3117. Type *t = type_deref(e.type);
  3118. if (is_type_union(t)) {
  3119. if (ta->ignores[0]) {
  3120. // NOTE(bill): This is not needed for optimization levels other than 0
  3121. return lb_emit_union_cast_only_ok_check(p, e, type, pos);
  3122. }
  3123. return lb_emit_union_cast(p, e, type, pos);
  3124. } else if (is_type_any(t)) {
  3125. return lb_emit_any_cast(p, e, type, pos);
  3126. } else {
  3127. GB_PANIC("TODO(bill): type assertion %s", type_to_string(e.type));
  3128. }
  3129. case_end;
  3130. case_ast_node(tc, TypeCast, expr);
  3131. lbValue e = lb_build_expr(p, tc->expr);
  3132. switch (tc->token.kind) {
  3133. case Token_cast:
  3134. return lb_emit_conv(p, e, type);
  3135. case Token_transmute:
  3136. return lb_emit_transmute(p, e, type);
  3137. }
  3138. GB_PANIC("Invalid AST TypeCast");
  3139. case_end;
  3140. case_ast_node(ac, AutoCast, expr);
  3141. lbValue value = lb_build_expr(p, ac->expr);
  3142. return lb_emit_conv(p, value, type);
  3143. case_end;
  3144. case_ast_node(ue, UnaryExpr, expr);
  3145. switch (ue->op.kind) {
  3146. case Token_And:
  3147. return lb_build_unary_and(p, expr);
  3148. default:
  3149. {
  3150. lbValue v = lb_build_expr(p, ue->expr);
  3151. return lb_emit_unary_arith(p, ue->op.kind, v, type);
  3152. }
  3153. }
  3154. case_end;
  3155. case_ast_node(be, BinaryExpr, expr);
  3156. return lb_build_binary_expr(p, expr);
  3157. case_end;
  3158. case_ast_node(pl, ProcLit, expr);
  3159. return lb_generate_anonymous_proc_lit(p->module, p->name, expr, p);
  3160. case_end;
  3161. case_ast_node(cl, CompoundLit, expr);
  3162. return lb_addr_load(p, lb_build_addr(p, expr));
  3163. case_end;
  3164. case_ast_node(ce, CallExpr, expr);
  3165. return lb_build_call_expr(p, expr);
  3166. case_end;
  3167. case_ast_node(se, SliceExpr, expr);
  3168. if (is_type_slice(type_of_expr(se->expr))) {
  3169. // NOTE(bill): Quick optimization
  3170. if (se->high == nullptr &&
  3171. (se->low == nullptr || lb_is_expr_constant_zero(se->low))) {
  3172. return lb_build_expr(p, se->expr);
  3173. }
  3174. }
  3175. return lb_addr_load(p, lb_build_addr(p, expr));
  3176. case_end;
  3177. case_ast_node(ie, IndexExpr, expr);
  3178. return lb_addr_load(p, lb_build_addr(p, expr));
  3179. case_end;
  3180. case_ast_node(ie, MatrixIndexExpr, expr);
  3181. return lb_addr_load(p, lb_build_addr(p, expr));
  3182. case_end;
  3183. case_ast_node(ia, InlineAsmExpr, expr);
  3184. Type *t = type_of_expr(expr);
  3185. GB_ASSERT(is_type_asm_proc(t));
  3186. String asm_string = {};
  3187. String constraints_string = {};
  3188. TypeAndValue tav;
  3189. tav = type_and_value_of_expr(ia->asm_string);
  3190. GB_ASSERT(is_type_string(tav.type));
  3191. GB_ASSERT(tav.value.kind == ExactValue_String);
  3192. asm_string = tav.value.value_string;
  3193. tav = type_and_value_of_expr(ia->constraints_string);
  3194. GB_ASSERT(is_type_string(tav.type));
  3195. GB_ASSERT(tav.value.kind == ExactValue_String);
  3196. constraints_string = tav.value.value_string;
  3197. LLVMInlineAsmDialect dialect = LLVMInlineAsmDialectATT;
  3198. switch (ia->dialect) {
  3199. case InlineAsmDialect_Default: dialect = LLVMInlineAsmDialectATT; break;
  3200. case InlineAsmDialect_ATT: dialect = LLVMInlineAsmDialectATT; break;
  3201. case InlineAsmDialect_Intel: dialect = LLVMInlineAsmDialectIntel; break;
  3202. default: GB_PANIC("Unhandled inline asm dialect"); break;
  3203. }
  3204. LLVMTypeRef func_type = lb_type_internal_for_procedures_raw(p->module, t);
  3205. LLVMValueRef the_asm = llvm_get_inline_asm(func_type, asm_string, constraints_string, ia->has_side_effects, ia->has_side_effects, dialect);
  3206. GB_ASSERT(the_asm != nullptr);
  3207. return {the_asm, t};
  3208. case_end;
  3209. }
  3210. GB_PANIC("lb_build_expr: %.*s", LIT(ast_strings[expr->kind]));
  3211. return {};
  3212. }
  3213. gb_internal lbAddr lb_get_soa_variable_addr(lbProcedure *p, Entity *e) {
  3214. return map_must_get(&p->module->soa_values, e);
  3215. }
  3216. gb_internal lbValue lb_get_using_variable(lbProcedure *p, Entity *e) {
  3217. GB_ASSERT(e->kind == Entity_Variable && e->flags & EntityFlag_Using);
  3218. String name = e->token.string;
  3219. Entity *parent = e->using_parent;
  3220. Selection sel = lookup_field(parent->type, name, false);
  3221. GB_ASSERT(sel.entity != nullptr);
  3222. lbValue *pv = map_get(&p->module->values, parent);
  3223. lbValue v = {};
  3224. bool is_soa = false;
  3225. if (pv == nullptr && parent->flags & EntityFlag_SoaPtrField) {
  3226. is_soa = true;
  3227. // NOTE(bill): using SOA value (probably from for-in statement)
  3228. lbAddr parent_addr = lb_get_soa_variable_addr(p, parent);
  3229. v = lb_addr_get_ptr(p, parent_addr);
  3230. } else if (pv != nullptr) {
  3231. v = *pv;
  3232. } else {
  3233. GB_ASSERT_MSG(e->using_expr != nullptr, "%.*s", LIT(name));
  3234. v = lb_build_addr_ptr(p, e->using_expr);
  3235. }
  3236. GB_ASSERT(v.value != nullptr);
  3237. GB_ASSERT_MSG(is_soa || parent->type == type_deref(v.type), "%s %s", type_to_string(parent->type), type_to_string(v.type));
  3238. lbValue ptr = lb_emit_deep_field_gep(p, v, sel);
  3239. if (parent->scope) {
  3240. if ((parent->scope->flags & (ScopeFlag_File|ScopeFlag_Pkg)) == 0) {
  3241. lb_add_debug_local_variable(p, ptr.value, e->type, e->token);
  3242. }
  3243. } else {
  3244. lb_add_debug_local_variable(p, ptr.value, e->type, e->token);
  3245. }
  3246. return ptr;
  3247. }
  3248. gb_internal lbAddr lb_build_addr_from_entity(lbProcedure *p, Entity *e, Ast *expr) {
  3249. GB_ASSERT(e != nullptr);
  3250. if (e->kind == Entity_Constant) {
  3251. Type *t = default_type(type_of_expr(expr));
  3252. lbValue v = lb_const_value(p->module, t, e->Constant.value);
  3253. if (LLVMIsConstant(v.value)) {
  3254. lbAddr g = lb_add_global_generated(p->module, t, v);
  3255. return g;
  3256. }
  3257. GB_ASSERT(LLVMIsALoadInst(v.value));
  3258. lbValue ptr = {};
  3259. ptr.value = LLVMGetOperand(v.value, 0);
  3260. ptr.type = alloc_type_pointer(t);
  3261. return lb_addr(ptr);
  3262. }
  3263. lbValue v = {};
  3264. lbValue *found = map_get(&p->module->values, e);
  3265. if (found) {
  3266. v = *found;
  3267. } else if (e->kind == Entity_Variable && e->flags & EntityFlag_Using) {
  3268. // NOTE(bill): Calculate the using variable every time
  3269. v = lb_get_using_variable(p, e);
  3270. } else if (e->flags & EntityFlag_SoaPtrField) {
  3271. return lb_get_soa_variable_addr(p, e);
  3272. }
  3273. if (v.value == nullptr) {
  3274. return lb_addr(lb_find_value_from_entity(p->module, e));
  3275. // error(expr, "%.*s Unknown value: %.*s, entity: %p %.*s",
  3276. // LIT(p->name),
  3277. // LIT(e->token.string), e, LIT(entity_strings[e->kind]));
  3278. // GB_PANIC("Unknown value");
  3279. }
  3280. return lb_addr(v);
  3281. }
  3282. gb_internal lbAddr lb_build_array_swizzle_addr(lbProcedure *p, AstCallExpr *ce, TypeAndValue const &tv) {
  3283. isize index_count = ce->args.count-1;
  3284. lbAddr addr = lb_build_addr(p, ce->args[0]);
  3285. if (index_count == 0) {
  3286. return addr;
  3287. }
  3288. Type *type = base_type(lb_addr_type(addr));
  3289. GB_ASSERT(type->kind == Type_Array);
  3290. i64 count = type->Array.count;
  3291. if (count <= 4 && index_count <= 4) {
  3292. u8 indices[4] = {};
  3293. u8 index_count = 0;
  3294. for (i32 i = 1; i < ce->args.count; i++) {
  3295. TypeAndValue tv = type_and_value_of_expr(ce->args[i]);
  3296. GB_ASSERT(is_type_integer(tv.type));
  3297. GB_ASSERT(tv.value.kind == ExactValue_Integer);
  3298. i64 src_index = big_int_to_i64(&tv.value.value_integer);
  3299. indices[index_count++] = cast(u8)src_index;
  3300. }
  3301. return lb_addr_swizzle(lb_addr_get_ptr(p, addr), tv.type, index_count, indices);
  3302. }
  3303. auto indices = slice_make<i32>(permanent_allocator(), ce->args.count-1);
  3304. isize index_index = 0;
  3305. for (i32 i = 1; i < ce->args.count; i++) {
  3306. TypeAndValue tv = type_and_value_of_expr(ce->args[i]);
  3307. GB_ASSERT(is_type_integer(tv.type));
  3308. GB_ASSERT(tv.value.kind == ExactValue_Integer);
  3309. i64 src_index = big_int_to_i64(&tv.value.value_integer);
  3310. indices[index_index++] = cast(i32)src_index;
  3311. }
  3312. return lb_addr_swizzle_large(lb_addr_get_ptr(p, addr), tv.type, indices);
  3313. }
  3314. gb_internal lbAddr lb_build_addr_internal(lbProcedure *p, Ast *expr);
  3315. gb_internal lbAddr lb_build_addr(lbProcedure *p, Ast *expr) {
  3316. expr = unparen_expr(expr);
  3317. // IMPORTANT NOTE(bill):
  3318. // Selector Call Expressions (foo->bar(...))
  3319. // must only evaluate `foo` once as it gets transformed into
  3320. // `foo.bar(foo, ...)`
  3321. // And if `foo` is a procedure call or something more complex, storing the value
  3322. // once is a very good idea
  3323. // If a stored value is found, it must be removed from the cache
  3324. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  3325. lbAddr *pp = map_get(&p->selector_addr, expr);
  3326. if (pp != nullptr) {
  3327. lbAddr res = *pp;
  3328. map_remove(&p->selector_addr, expr);
  3329. return res;
  3330. }
  3331. }
  3332. lbAddr addr = lb_build_addr_internal(p, expr);
  3333. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  3334. map_set(&p->selector_addr, expr, addr);
  3335. }
  3336. return addr;
  3337. }
  3338. gb_internal void lb_build_addr_compound_lit_populate(lbProcedure *p, Slice<Ast *> const &elems, Array<lbCompoundLitElemTempData> *temp_data, Type *compound_type) {
  3339. Type *bt = base_type(compound_type);
  3340. Type *et = nullptr;
  3341. switch (bt->kind) {
  3342. case Type_Array: et = bt->Array.elem; break;
  3343. case Type_EnumeratedArray: et = bt->EnumeratedArray.elem; break;
  3344. case Type_Slice: et = bt->Slice.elem; break;
  3345. case Type_BitSet: et = bt->BitSet.elem; break;
  3346. case Type_DynamicArray: et = bt->DynamicArray.elem; break;
  3347. case Type_SimdVector: et = bt->SimdVector.elem; break;
  3348. case Type_Matrix: et = bt->Matrix.elem; break;
  3349. }
  3350. GB_ASSERT(et != nullptr);
  3351. // NOTE(bill): Separate value, gep, store into their own chunks
  3352. for_array(i, elems) {
  3353. Ast *elem = elems[i];
  3354. if (elem->kind == Ast_FieldValue) {
  3355. ast_node(fv, FieldValue, elem);
  3356. if (bt->kind != Type_DynamicArray && lb_is_elem_const(fv->value, et)) {
  3357. continue;
  3358. }
  3359. if (is_ast_range(fv->field)) {
  3360. ast_node(ie, BinaryExpr, fv->field);
  3361. TypeAndValue lo_tav = ie->left->tav;
  3362. TypeAndValue hi_tav = ie->right->tav;
  3363. GB_ASSERT(lo_tav.mode == Addressing_Constant);
  3364. GB_ASSERT(hi_tav.mode == Addressing_Constant);
  3365. TokenKind op = ie->op.kind;
  3366. i64 lo = exact_value_to_i64(lo_tav.value);
  3367. i64 hi = exact_value_to_i64(hi_tav.value);
  3368. if (op != Token_RangeHalf) {
  3369. hi += 1;
  3370. }
  3371. lbValue value = lb_emit_conv(p, lb_build_expr(p, fv->value), et);
  3372. GB_ASSERT((hi-lo) > 0);
  3373. if (bt->kind == Type_Matrix) {
  3374. for (i64 k = lo; k < hi; k++) {
  3375. lbCompoundLitElemTempData data = {};
  3376. data.value = value;
  3377. data.elem_index = matrix_row_major_index_to_offset(bt, k);
  3378. array_add(temp_data, data);
  3379. }
  3380. } else {
  3381. enum {MAX_ELEMENT_AMOUNT = 32};
  3382. if ((hi-lo) <= MAX_ELEMENT_AMOUNT) {
  3383. for (i64 k = lo; k < hi; k++) {
  3384. lbCompoundLitElemTempData data = {};
  3385. data.value = value;
  3386. data.elem_index = k;
  3387. array_add(temp_data, data);
  3388. }
  3389. } else {
  3390. lbCompoundLitElemTempData data = {};
  3391. data.value = value;
  3392. data.elem_index = lo;
  3393. data.elem_length = hi-lo;
  3394. array_add(temp_data, data);
  3395. }
  3396. }
  3397. } else {
  3398. auto tav = fv->field->tav;
  3399. GB_ASSERT(tav.mode == Addressing_Constant);
  3400. i64 index = exact_value_to_i64(tav.value);
  3401. lbValue value = lb_emit_conv(p, lb_build_expr(p, fv->value), et);
  3402. GB_ASSERT(!is_type_tuple(value.type));
  3403. lbCompoundLitElemTempData data = {};
  3404. data.value = value;
  3405. data.expr = fv->value;
  3406. if (bt->kind == Type_Matrix) {
  3407. data.elem_index = matrix_row_major_index_to_offset(bt, index);
  3408. } else {
  3409. data.elem_index = index;
  3410. }
  3411. array_add(temp_data, data);
  3412. }
  3413. } else {
  3414. if (bt->kind != Type_DynamicArray && lb_is_elem_const(elem, et)) {
  3415. continue;
  3416. }
  3417. lbValue field_expr = lb_build_expr(p, elem);
  3418. GB_ASSERT(!is_type_tuple(field_expr.type));
  3419. lbValue ev = lb_emit_conv(p, field_expr, et);
  3420. lbCompoundLitElemTempData data = {};
  3421. data.value = ev;
  3422. if (bt->kind == Type_Matrix) {
  3423. data.elem_index = matrix_row_major_index_to_offset(bt, i);
  3424. } else {
  3425. data.elem_index = i;
  3426. }
  3427. array_add(temp_data, data);
  3428. }
  3429. }
  3430. }
  3431. gb_internal void lb_build_addr_compound_lit_assign_array(lbProcedure *p, Array<lbCompoundLitElemTempData> const &temp_data) {
  3432. for (auto const &td : temp_data) {
  3433. if (td.value.value != nullptr) {
  3434. if (td.elem_length > 0) {
  3435. auto loop_data = lb_loop_start(p, cast(isize)td.elem_length, t_i32);
  3436. {
  3437. lbValue dst = td.gep;
  3438. dst = lb_emit_ptr_offset(p, dst, loop_data.idx);
  3439. lb_emit_store(p, dst, td.value);
  3440. }
  3441. lb_loop_end(p, loop_data);
  3442. } else {
  3443. lb_emit_store(p, td.gep, td.value);
  3444. }
  3445. }
  3446. }
  3447. }
  3448. gb_internal lbAddr lb_build_addr_index_expr(lbProcedure *p, Ast *expr) {
  3449. ast_node(ie, IndexExpr, expr);
  3450. Type *t = base_type(type_of_expr(ie->expr));
  3451. bool deref = is_type_pointer(t);
  3452. t = base_type(type_deref(t));
  3453. if (is_type_soa_struct(t)) {
  3454. // SOA STRUCTURES!!!!
  3455. lbValue val = lb_build_addr_ptr(p, ie->expr);
  3456. if (deref) {
  3457. val = lb_emit_load(p, val);
  3458. }
  3459. lbValue index = lb_build_expr(p, ie->index);
  3460. return lb_addr_soa_variable(val, index, ie->index);
  3461. }
  3462. if (ie->expr->tav.mode == Addressing_SoaVariable) {
  3463. // SOA Structures for slices/dynamic arrays
  3464. GB_ASSERT_MSG(is_type_multi_pointer(type_of_expr(ie->expr)), "%s", type_to_string(type_of_expr(ie->expr)));
  3465. lbValue field = lb_build_expr(p, ie->expr);
  3466. lbValue index = lb_build_expr(p, ie->index);
  3467. if (!build_context.no_bounds_check) {
  3468. Ast *se_expr = unparen_expr(ie->expr);
  3469. if (se_expr->kind == Ast_SelectorExpr) {
  3470. ast_node(se, SelectorExpr, se_expr);
  3471. lbValue len = {};
  3472. Type *type = base_type(type_deref(type_of_expr(se->expr)));
  3473. GB_ASSERT_MSG(is_type_soa_struct(type), "%s", type_to_string(type));
  3474. if (type->Struct.soa_kind == StructSoa_Fixed) {
  3475. len = lb_const_int(p->module, t_int, type->Struct.soa_count);
  3476. } else {
  3477. lbAddr *found = map_get(&p->selector_addr, se_expr);
  3478. if (found) {
  3479. lbAddr addr = *found;
  3480. lbValue parent = lb_addr_get_ptr(p, addr);
  3481. if (is_type_pointer(type_deref(parent.type))) {
  3482. parent = lb_emit_load(p, parent);
  3483. }
  3484. len = lb_soa_struct_len(p, parent);
  3485. }
  3486. }
  3487. if (len.value) {
  3488. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3489. }
  3490. } else {
  3491. // TODO(bill): how do you even do bounds checking here?
  3492. }
  3493. }
  3494. lbValue val = lb_emit_ptr_offset(p, field, index);
  3495. return lb_addr(val);
  3496. }
  3497. GB_ASSERT_MSG(is_type_indexable(t), "%s %s", type_to_string(t), expr_to_string(expr));
  3498. if (is_type_map(t)) {
  3499. lbAddr map_addr = lb_build_addr(p, ie->expr);
  3500. lbValue key = lb_build_expr(p, ie->index);
  3501. key = lb_emit_conv(p, key, t->Map.key);
  3502. Type *result_type = type_of_expr(expr);
  3503. lbValue map_ptr = lb_addr_get_ptr(p, map_addr);
  3504. if (is_type_pointer(type_deref(map_ptr.type))) {
  3505. map_ptr = lb_emit_load(p, map_ptr);
  3506. }
  3507. return lb_addr_map(map_ptr, key, t, result_type);
  3508. }
  3509. switch (t->kind) {
  3510. case Type_Array: {
  3511. lbValue array = {};
  3512. array = lb_build_addr_ptr(p, ie->expr);
  3513. if (deref) {
  3514. array = lb_emit_load(p, array);
  3515. }
  3516. lbValue index = lb_build_expr(p, ie->index);
  3517. index = lb_emit_conv(p, index, t_int);
  3518. lbValue elem = lb_emit_array_ep(p, array, index);
  3519. auto index_tv = type_and_value_of_expr(ie->index);
  3520. if (index_tv.mode != Addressing_Constant) {
  3521. lbValue len = lb_const_int(p->module, t_int, t->Array.count);
  3522. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3523. }
  3524. return lb_addr(elem);
  3525. }
  3526. case Type_EnumeratedArray: {
  3527. lbValue array = {};
  3528. array = lb_build_addr_ptr(p, ie->expr);
  3529. if (deref) {
  3530. array = lb_emit_load(p, array);
  3531. }
  3532. Type *index_type = t->EnumeratedArray.index;
  3533. auto index_tv = type_and_value_of_expr(ie->index);
  3534. lbValue index = {};
  3535. if (compare_exact_values(Token_NotEq, *t->EnumeratedArray.min_value, exact_value_i64(0))) {
  3536. if (index_tv.mode == Addressing_Constant) {
  3537. ExactValue idx = exact_value_sub(index_tv.value, *t->EnumeratedArray.min_value);
  3538. index = lb_const_value(p->module, index_type, idx);
  3539. } else {
  3540. index = lb_emit_arith(p, Token_Sub,
  3541. lb_build_expr(p, ie->index),
  3542. lb_const_value(p->module, index_type, *t->EnumeratedArray.min_value),
  3543. index_type);
  3544. index = lb_emit_conv(p, index, t_int);
  3545. }
  3546. } else {
  3547. index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3548. }
  3549. lbValue elem = lb_emit_array_ep(p, array, index);
  3550. if (index_tv.mode != Addressing_Constant) {
  3551. lbValue len = lb_const_int(p->module, t_int, t->EnumeratedArray.count);
  3552. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3553. }
  3554. return lb_addr(elem);
  3555. }
  3556. case Type_Slice: {
  3557. lbValue slice = {};
  3558. slice = lb_build_expr(p, ie->expr);
  3559. if (deref) {
  3560. slice = lb_emit_load(p, slice);
  3561. }
  3562. lbValue elem = lb_slice_elem(p, slice);
  3563. lbValue index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3564. lbValue len = lb_slice_len(p, slice);
  3565. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3566. lbValue v = lb_emit_ptr_offset(p, elem, index);
  3567. return lb_addr(v);
  3568. }
  3569. case Type_MultiPointer: {
  3570. lbValue multi_ptr = {};
  3571. multi_ptr = lb_build_expr(p, ie->expr);
  3572. if (deref) {
  3573. multi_ptr = lb_emit_load(p, multi_ptr);
  3574. }
  3575. lbValue index = lb_build_expr(p, ie->index);
  3576. index = lb_emit_conv(p, index, t_int);
  3577. lbValue v = {};
  3578. LLVMValueRef indices[1] = {index.value};
  3579. v.value = LLVMBuildGEP2(p->builder, lb_type(p->module, t->MultiPointer.elem), multi_ptr.value, indices, 1, "");
  3580. v.type = alloc_type_pointer(t->MultiPointer.elem);
  3581. return lb_addr(v);
  3582. }
  3583. case Type_RelativeMultiPointer: {
  3584. lbAddr rel_ptr_addr = {};
  3585. if (deref) {
  3586. lbValue rel_ptr_ptr = lb_build_expr(p, ie->expr);
  3587. rel_ptr_addr = lb_addr(rel_ptr_ptr);
  3588. } else {
  3589. rel_ptr_addr = lb_build_addr(p, ie->expr);
  3590. }
  3591. lbValue rel_ptr = lb_relative_pointer_to_pointer(p, rel_ptr_addr);
  3592. lbValue index = lb_build_expr(p, ie->index);
  3593. index = lb_emit_conv(p, index, t_int);
  3594. lbValue v = {};
  3595. Type *pointer_type = base_type(t->RelativeMultiPointer.pointer_type);
  3596. GB_ASSERT(pointer_type->kind == Type_MultiPointer);
  3597. Type *elem = pointer_type->MultiPointer.elem;
  3598. LLVMValueRef indices[1] = {index.value};
  3599. v.value = LLVMBuildGEP2(p->builder, lb_type(p->module, elem), rel_ptr.value, indices, 1, "");
  3600. v.type = alloc_type_pointer(elem);
  3601. return lb_addr(v);
  3602. }
  3603. case Type_DynamicArray: {
  3604. lbValue dynamic_array = {};
  3605. dynamic_array = lb_build_expr(p, ie->expr);
  3606. if (deref) {
  3607. dynamic_array = lb_emit_load(p, dynamic_array);
  3608. }
  3609. lbValue elem = lb_dynamic_array_elem(p, dynamic_array);
  3610. lbValue len = lb_dynamic_array_len(p, dynamic_array);
  3611. lbValue index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3612. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3613. lbValue v = lb_emit_ptr_offset(p, elem, index);
  3614. return lb_addr(v);
  3615. }
  3616. case Type_Matrix: {
  3617. lbValue matrix = {};
  3618. matrix = lb_build_addr_ptr(p, ie->expr);
  3619. if (deref) {
  3620. matrix = lb_emit_load(p, matrix);
  3621. }
  3622. lbValue index = lb_build_expr(p, ie->index);
  3623. index = lb_emit_conv(p, index, t_int);
  3624. isize bounds_len = 0;
  3625. lbValue elem = {};
  3626. if (t->Matrix.is_row_major) {
  3627. bounds_len = t->Matrix.row_count;
  3628. elem = lb_emit_matrix_ep(p, matrix, index, lb_const_int(p->module, t_int, 0));
  3629. } else {
  3630. bounds_len = t->Matrix.column_count;
  3631. elem = lb_emit_matrix_ep(p, matrix, lb_const_int(p->module, t_int, 0), index);
  3632. }
  3633. elem = lb_emit_conv(p, elem, alloc_type_pointer(type_of_expr(expr)));
  3634. auto index_tv = type_and_value_of_expr(ie->index);
  3635. if (index_tv.mode != Addressing_Constant) {
  3636. lbValue len = lb_const_int(p->module, t_int, bounds_len);
  3637. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3638. }
  3639. return lb_addr(elem);
  3640. }
  3641. case Type_Basic: { // Basic_string
  3642. lbValue str;
  3643. lbValue elem;
  3644. lbValue len;
  3645. lbValue index;
  3646. str = lb_build_expr(p, ie->expr);
  3647. if (deref) {
  3648. str = lb_emit_load(p, str);
  3649. }
  3650. elem = lb_string_elem(p, str);
  3651. len = lb_string_len(p, str);
  3652. index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3653. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3654. return lb_addr(lb_emit_ptr_offset(p, elem, index));
  3655. }
  3656. }
  3657. return {};
  3658. }
  3659. gb_internal lbAddr lb_build_addr_slice_expr(lbProcedure *p, Ast *expr) {
  3660. ast_node(se, SliceExpr, expr);
  3661. lbValue low = lb_const_int(p->module, t_int, 0);
  3662. lbValue high = {};
  3663. if (se->low != nullptr) {
  3664. low = lb_correct_endianness(p, lb_build_expr(p, se->low));
  3665. }
  3666. if (se->high != nullptr) {
  3667. high = lb_correct_endianness(p, lb_build_expr(p, se->high));
  3668. }
  3669. bool no_indices = se->low == nullptr && se->high == nullptr;
  3670. lbAddr addr = lb_build_addr(p, se->expr);
  3671. lbValue base = lb_addr_load(p, addr);
  3672. Type *type = base_type(base.type);
  3673. if (is_type_pointer(type)) {
  3674. type = base_type(type_deref(type));
  3675. addr = lb_addr(base);
  3676. base = lb_addr_load(p, addr);
  3677. }
  3678. switch (type->kind) {
  3679. case Type_Slice: {
  3680. Type *slice_type = type;
  3681. lbValue len = lb_slice_len(p, base);
  3682. if (high.value == nullptr) high = len;
  3683. if (!no_indices) {
  3684. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3685. }
  3686. lbValue elem = lb_emit_ptr_offset(p, lb_slice_elem(p, base), low);
  3687. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3688. lbAddr slice = lb_add_local_generated(p, slice_type, false);
  3689. lb_fill_slice(p, slice, elem, new_len);
  3690. return slice;
  3691. }
  3692. case Type_RelativePointer:
  3693. GB_PANIC("TODO(bill): Type_RelativePointer should be handled above already on the lb_addr_load");
  3694. break;
  3695. case Type_RelativeMultiPointer:
  3696. GB_PANIC("TODO(bill): Type_RelativeMultiPointer should be handled above already on the lb_addr_load");
  3697. break;
  3698. case Type_DynamicArray: {
  3699. Type *elem_type = type->DynamicArray.elem;
  3700. Type *slice_type = alloc_type_slice(elem_type);
  3701. lbValue len = lb_dynamic_array_len(p, base);
  3702. if (high.value == nullptr) high = len;
  3703. if (!no_indices) {
  3704. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3705. }
  3706. lbValue elem = lb_emit_ptr_offset(p, lb_dynamic_array_elem(p, base), low);
  3707. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3708. lbAddr slice = lb_add_local_generated(p, slice_type, false);
  3709. lb_fill_slice(p, slice, elem, new_len);
  3710. return slice;
  3711. }
  3712. case Type_MultiPointer: {
  3713. lbAddr res = lb_add_local_generated(p, type_of_expr(expr), false);
  3714. if (se->high == nullptr) {
  3715. lbValue offset = base;
  3716. LLVMValueRef indices[1] = {low.value};
  3717. offset.value = LLVMBuildGEP2(p->builder, lb_type(p->module, base_type(offset.type)->MultiPointer.elem), offset.value, indices, 1, "");
  3718. lb_addr_store(p, res, offset);
  3719. } else {
  3720. low = lb_emit_conv(p, low, t_int);
  3721. high = lb_emit_conv(p, high, t_int);
  3722. lb_emit_multi_pointer_slice_bounds_check(p, se->open, low, high);
  3723. LLVMValueRef indices[1] = {low.value};
  3724. LLVMValueRef ptr = LLVMBuildGEP2(p->builder, lb_type(p->module, base_type(base.type)->MultiPointer.elem), base.value, indices, 1, "");
  3725. LLVMValueRef len = LLVMBuildSub(p->builder, high.value, low.value, "");
  3726. LLVMValueRef gep0 = lb_emit_struct_ep(p, res.addr, 0).value;
  3727. LLVMValueRef gep1 = lb_emit_struct_ep(p, res.addr, 1).value;
  3728. LLVMBuildStore(p->builder, ptr, gep0);
  3729. LLVMBuildStore(p->builder, len, gep1);
  3730. }
  3731. return res;
  3732. }
  3733. case Type_Array: {
  3734. Type *slice_type = alloc_type_slice(type->Array.elem);
  3735. lbValue len = lb_const_int(p->module, t_int, type->Array.count);
  3736. if (high.value == nullptr) high = len;
  3737. bool low_const = type_and_value_of_expr(se->low).mode == Addressing_Constant;
  3738. bool high_const = type_and_value_of_expr(se->high).mode == Addressing_Constant;
  3739. if (!low_const || !high_const) {
  3740. if (!no_indices) {
  3741. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3742. }
  3743. }
  3744. lbValue elem = lb_emit_ptr_offset(p, lb_array_elem(p, lb_addr_get_ptr(p, addr)), low);
  3745. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3746. lbAddr slice = lb_add_local_generated(p, slice_type, false);
  3747. lb_fill_slice(p, slice, elem, new_len);
  3748. return slice;
  3749. }
  3750. case Type_Basic: {
  3751. GB_ASSERT_MSG(are_types_identical(type, t_string), "got %s", type_to_string(type));
  3752. lbValue len = lb_string_len(p, base);
  3753. if (high.value == nullptr) high = len;
  3754. if (!no_indices) {
  3755. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3756. }
  3757. lbValue elem = lb_emit_ptr_offset(p, lb_string_elem(p, base), low);
  3758. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3759. lbAddr str = lb_add_local_generated(p, t_string, false);
  3760. lb_fill_string(p, str, elem, new_len);
  3761. return str;
  3762. }
  3763. case Type_Struct:
  3764. if (is_type_soa_struct(type)) {
  3765. lbValue len = lb_soa_struct_len(p, lb_addr_get_ptr(p, addr));
  3766. if (high.value == nullptr) high = len;
  3767. if (!no_indices) {
  3768. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3769. }
  3770. #if 1
  3771. lbAddr dst = lb_add_local_generated(p, type_of_expr(expr), true);
  3772. if (type->Struct.soa_kind == StructSoa_Fixed) {
  3773. i32 field_count = cast(i32)type->Struct.fields.count;
  3774. for (i32 i = 0; i < field_count; i++) {
  3775. lbValue field_dst = lb_emit_struct_ep(p, dst.addr, i);
  3776. lbValue field_src = lb_emit_struct_ep(p, lb_addr_get_ptr(p, addr), i);
  3777. field_src = lb_emit_array_ep(p, field_src, low);
  3778. field_src = lb_emit_conv(p, field_src, type_deref(field_dst.type));
  3779. lb_emit_store(p, field_dst, field_src);
  3780. }
  3781. lbValue len_dst = lb_emit_struct_ep(p, dst.addr, field_count);
  3782. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3783. lb_emit_store(p, len_dst, new_len);
  3784. } else if (type->Struct.soa_kind == StructSoa_Slice) {
  3785. if (no_indices) {
  3786. lb_addr_store(p, dst, base);
  3787. } else {
  3788. i32 field_count = cast(i32)type->Struct.fields.count - 1;
  3789. for (i32 i = 0; i < field_count; i++) {
  3790. lbValue field_dst = lb_emit_struct_ep(p, dst.addr, i);
  3791. lbValue field_src = lb_emit_struct_ev(p, base, i);
  3792. field_src = lb_emit_ptr_offset(p, field_src, low);
  3793. field_src = lb_emit_conv(p, field_src, type_deref(field_dst.type));
  3794. lb_emit_store(p, field_dst, field_src);
  3795. }
  3796. lbValue len_dst = lb_emit_struct_ep(p, dst.addr, field_count);
  3797. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3798. lb_emit_store(p, len_dst, new_len);
  3799. }
  3800. } else if (type->Struct.soa_kind == StructSoa_Dynamic) {
  3801. i32 field_count = cast(i32)type->Struct.fields.count - 3;
  3802. for (i32 i = 0; i < field_count; i++) {
  3803. lbValue field_dst = lb_emit_struct_ep(p, dst.addr, i);
  3804. lbValue field_src = lb_emit_struct_ev(p, base, i);
  3805. field_src = lb_emit_ptr_offset(p, field_src, low);
  3806. field_src = lb_emit_conv(p, field_src, type_deref(field_dst.type));
  3807. lb_emit_store(p, field_dst, field_src);
  3808. }
  3809. lbValue len_dst = lb_emit_struct_ep(p, dst.addr, field_count);
  3810. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3811. lb_emit_store(p, len_dst, new_len);
  3812. }
  3813. return dst;
  3814. #endif
  3815. }
  3816. break;
  3817. }
  3818. GB_PANIC("Unknown slicable type");
  3819. return {};
  3820. }
  3821. gb_internal lbAddr lb_build_addr_compound_lit(lbProcedure *p, Ast *expr) {
  3822. ast_node(cl, CompoundLit, expr);
  3823. Type *type = type_of_expr(expr);
  3824. Type *bt = base_type(type);
  3825. lbAddr v = lb_add_local_generated(p, type, true);
  3826. TEMPORARY_ALLOCATOR_GUARD();
  3827. Type *et = nullptr;
  3828. switch (bt->kind) {
  3829. case Type_Array: et = bt->Array.elem; break;
  3830. case Type_EnumeratedArray: et = bt->EnumeratedArray.elem; break;
  3831. case Type_Slice: et = bt->Slice.elem; break;
  3832. case Type_BitSet: et = bt->BitSet.elem; break;
  3833. case Type_SimdVector: et = bt->SimdVector.elem; break;
  3834. case Type_Matrix: et = bt->Matrix.elem; break;
  3835. }
  3836. String proc_name = {};
  3837. if (p->entity) {
  3838. proc_name = p->entity->token.string;
  3839. }
  3840. TokenPos pos = ast_token(expr).pos;
  3841. switch (bt->kind) {
  3842. default: GB_PANIC("Unknown CompoundLit type: %s", type_to_string(type)); break;
  3843. case Type_BitField: {
  3844. TEMPORARY_ALLOCATOR_GUARD();
  3845. // Type *backing_type = core_type(bt->BitField.backing_type);
  3846. struct FieldData {
  3847. Type *field_type;
  3848. u64 bit_offset;
  3849. u64 bit_size;
  3850. };
  3851. auto values = array_make<lbValue>(temporary_allocator(), 0, cl->elems.count);
  3852. auto fields = array_make<FieldData>(temporary_allocator(), 0, cl->elems.count);
  3853. for (Ast *elem : cl->elems) {
  3854. ast_node(fv, FieldValue, elem);
  3855. String name = fv->field->Ident.token.string;
  3856. Selection sel = lookup_field(bt, name, false);
  3857. GB_ASSERT(sel.is_bit_field);
  3858. GB_ASSERT(!sel.indirect);
  3859. GB_ASSERT(sel.index.count == 1);
  3860. GB_ASSERT(sel.entity != nullptr);
  3861. i64 index = sel.index[0];
  3862. Entity *f = bt->BitField.fields[index];
  3863. GB_ASSERT(f == sel.entity);
  3864. i64 bit_offset = bt->BitField.bit_offsets[index];
  3865. i64 bit_size = bt->BitField.bit_sizes[index];
  3866. GB_ASSERT(bit_size > 0);
  3867. Type *field_type = sel.entity->type;
  3868. lbValue field_expr = lb_build_expr(p, fv->value);
  3869. field_expr = lb_emit_conv(p, field_expr, field_type);
  3870. array_add(&values, field_expr);
  3871. array_add(&fields, FieldData{field_type, cast(u64)bit_offset, cast(u64)bit_size});
  3872. }
  3873. // NOTE(bill): inline insertion sort should be good enough, right?
  3874. for (isize i = 1; i < values.count; i++) {
  3875. for (isize j = i;
  3876. j > 0 && fields[i].bit_offset < fields[j].bit_offset;
  3877. j--) {
  3878. auto vtmp = values[j];
  3879. values[j] = values[j-1];
  3880. values[j-1] = vtmp;
  3881. auto ftmp = fields[j];
  3882. fields[j] = fields[j-1];
  3883. fields[j-1] = ftmp;
  3884. }
  3885. }
  3886. bool any_fields_different_endian = false;
  3887. for (auto const &f : fields) {
  3888. if (is_type_different_to_arch_endianness(f.field_type)) {
  3889. // NOTE(bill): Just be slow for this, to be correct
  3890. any_fields_different_endian = true;
  3891. break;
  3892. }
  3893. }
  3894. if (!any_fields_different_endian &&
  3895. fields.count == bt->BitField.fields.count) {
  3896. // SINGLE INTEGER BACKING ONLY
  3897. Type *backing_type = core_type(bt->BitField.backing_type);
  3898. GB_ASSERT(is_type_integer(backing_type) ||
  3899. (is_type_array(backing_type) && is_type_integer(backing_type->Array.elem)));
  3900. // NOTE(bill): all fields are present
  3901. // this means no masking is necessary since on write, the bits will be overridden
  3902. lbValue dst_byte_ptr = lb_emit_conv(p, v.addr, t_u8_ptr);
  3903. u64 total_bit_size = cast(u64)(8*type_size_of(bt));
  3904. if (is_type_integer(backing_type)) {
  3905. LLVMTypeRef lit = lb_type(p->module, backing_type);
  3906. LLVMValueRef res = LLVMConstInt(lit, 0, false);
  3907. for (isize i = 0; i < fields.count; i++) {
  3908. auto const &f = fields[i];
  3909. LLVMValueRef mask = LLVMConstInt(lit, 1, false);
  3910. mask = LLVMConstShl(mask, LLVMConstInt(lit, f.bit_size, false));
  3911. mask = LLVMConstSub(mask, LLVMConstInt(lit, 1, false));
  3912. LLVMValueRef elem = values[i].value;
  3913. if (lb_sizeof(lit) < lb_sizeof(LLVMTypeOf(elem))) {
  3914. elem = LLVMBuildTrunc(p->builder, elem, lit, "");
  3915. } else {
  3916. elem = LLVMBuildZExt(p->builder, elem, lit, "");
  3917. }
  3918. elem = LLVMBuildAnd(p->builder, elem, mask, "");
  3919. elem = LLVMBuildShl(p->builder, elem, LLVMConstInt(lit, f.bit_offset, false), "");
  3920. res = LLVMBuildOr(p->builder, res, elem, "");
  3921. }
  3922. LLVMBuildStore(p->builder, res, v.addr.value);
  3923. } else if (is_type_array(backing_type)) {
  3924. // ARRAY OF INTEGER BACKING
  3925. i64 array_count = backing_type->Array.count;
  3926. LLVMTypeRef lit = lb_type(p->module, core_type(backing_type->Array.elem));
  3927. gb_unused(array_count);
  3928. gb_unused(lit);
  3929. LLVMValueRef *elems = gb_alloc_array(temporary_allocator(), LLVMValueRef, array_count);
  3930. for (i64 i = 0; i < array_count; i++) {
  3931. elems[i] = LLVMConstInt(lit, 0, false);
  3932. }
  3933. u64 elem_bit_size = cast(u64)(8*type_size_of(backing_type->Array.elem));
  3934. u64 curr_bit_offset = 0;
  3935. for (isize i = 0; i < fields.count; i++) {
  3936. auto const &f = fields[i];
  3937. LLVMValueRef val = values[i].value;
  3938. LLVMTypeRef vt = lb_type(p->module, values[i].type);
  3939. for (u64 bits_to_set = f.bit_size;
  3940. bits_to_set > 0;
  3941. /**/) {
  3942. i64 elem_idx = curr_bit_offset/elem_bit_size;
  3943. u64 elem_bit_offset = curr_bit_offset%elem_bit_size;
  3944. u64 mask_width = gb_min(bits_to_set, elem_bit_size-elem_bit_offset);
  3945. GB_ASSERT(mask_width > 0);
  3946. bits_to_set -= mask_width;
  3947. LLVMValueRef mask = LLVMConstInt(vt, 1, false);
  3948. mask = LLVMConstShl(mask, LLVMConstInt(vt, mask_width, false));
  3949. mask = LLVMConstSub(mask, LLVMConstInt(vt, 1, false));
  3950. LLVMValueRef to_set = LLVMBuildAnd(p->builder, val, mask, "");
  3951. if (elem_bit_offset != 0) {
  3952. to_set = LLVMBuildShl(p->builder, to_set, LLVMConstInt(vt, elem_bit_offset, false), "");
  3953. }
  3954. to_set = LLVMBuildTrunc(p->builder, to_set, lit, "");
  3955. if (LLVMIsNull(elems[elem_idx])) {
  3956. elems[elem_idx] = to_set; // don't even bother doing `0 | to_set`
  3957. } else {
  3958. elems[elem_idx] = LLVMBuildOr(p->builder, elems[elem_idx], to_set, "");
  3959. }
  3960. if (mask_width != 0) {
  3961. val = LLVMBuildLShr(p->builder, val, LLVMConstInt(vt, mask_width, false), "");
  3962. }
  3963. curr_bit_offset += mask_width;
  3964. }
  3965. GB_ASSERT(curr_bit_offset == f.bit_offset + f.bit_size);
  3966. }
  3967. for (i64 i = 0; i < array_count; i++) {
  3968. LLVMValueRef elem_ptr = LLVMBuildStructGEP2(p->builder, lb_type(p->module, backing_type), v.addr.value, cast(unsigned)i, "");
  3969. LLVMBuildStore(p->builder, elems[i], elem_ptr);
  3970. }
  3971. } else {
  3972. // SLOW STORAGE
  3973. for_array(i, fields) {
  3974. auto const &f = fields[i];
  3975. if ((f.bit_offset & 7) == 0) {
  3976. u64 unpacked_bit_size = cast(u64)(8*type_size_of(f.field_type));
  3977. u64 byte_size = (f.bit_size+7)/8;
  3978. if (f.bit_offset + unpacked_bit_size <= total_bit_size) {
  3979. byte_size = unpacked_bit_size/8;
  3980. }
  3981. lbValue dst = lb_emit_ptr_offset(p, dst_byte_ptr, lb_const_int(p->module, t_int, f.bit_offset/8));
  3982. lbValue src = lb_address_from_load_or_generate_local(p, values[i]);
  3983. lb_mem_copy_non_overlapping(p, dst, src, lb_const_int(p->module, t_uintptr, byte_size));
  3984. } else {
  3985. lbAddr dst = lb_addr_bit_field(v.addr, f.field_type, f.bit_offset, f.bit_size);
  3986. lb_addr_store(p, dst, values[i]);
  3987. }
  3988. }
  3989. }
  3990. } else {
  3991. // individual storing
  3992. for_array(i, values) {
  3993. auto const &f = fields[i];
  3994. lbAddr dst = lb_addr_bit_field(v.addr, f.field_type, f.bit_offset, f.bit_size);
  3995. lb_addr_store(p, dst, values[i]);
  3996. }
  3997. }
  3998. return v;
  3999. }
  4000. case Type_Struct: {
  4001. // TODO(bill): "constant" '#raw_union's are not initialized constantly at the moment.
  4002. // NOTE(bill): This is due to the layout of the unions when printed to LLVM-IR
  4003. bool is_raw_union = is_type_raw_union(bt);
  4004. GB_ASSERT(is_type_struct(bt) || is_raw_union);
  4005. TypeStruct *st = &bt->Struct;
  4006. if (cl->elems.count > 0) {
  4007. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4008. lbValue comp_lit_ptr = lb_addr_get_ptr(p, v);
  4009. for_array(field_index, cl->elems) {
  4010. Ast *elem = cl->elems[field_index];
  4011. lbValue field_expr = {};
  4012. Entity *field = nullptr;
  4013. isize index = field_index;
  4014. if (elem->kind == Ast_FieldValue) {
  4015. ast_node(fv, FieldValue, elem);
  4016. String name = fv->field->Ident.token.string;
  4017. Selection sel = lookup_field(bt, name, false);
  4018. GB_ASSERT(!sel.indirect);
  4019. elem = fv->value;
  4020. if (sel.index.count > 1) {
  4021. if (lb_is_nested_possibly_constant(type, sel, elem)) {
  4022. continue;
  4023. }
  4024. field_expr = lb_build_expr(p, elem);
  4025. field_expr = lb_emit_conv(p, field_expr, sel.entity->type);
  4026. if (sel.is_bit_field) {
  4027. Selection sub_sel = trim_selection(sel);
  4028. lbValue trimmed_dst = lb_emit_deep_field_gep(p, comp_lit_ptr, sub_sel);
  4029. Type *bf = base_type(type_deref(trimmed_dst.type));
  4030. if (is_type_pointer(bf)) {
  4031. trimmed_dst = lb_emit_load(p, trimmed_dst);
  4032. bf = base_type(type_deref(trimmed_dst.type));
  4033. }
  4034. GB_ASSERT(bf->kind == Type_BitField);
  4035. isize idx = sel.index[sel.index.count-1];
  4036. lbAddr dst = lb_addr_bit_field(trimmed_dst, bf->BitField.fields[idx]->type, bf->BitField.bit_offsets[idx], bf->BitField.bit_sizes[idx]);
  4037. lb_addr_store(p, dst, field_expr);
  4038. } else {
  4039. lbValue dst = lb_emit_deep_field_gep(p, comp_lit_ptr, sel);
  4040. lb_emit_store(p, dst, field_expr);
  4041. }
  4042. continue;
  4043. }
  4044. index = sel.index[0];
  4045. } else {
  4046. Selection sel = lookup_field_from_index(bt, st->fields[field_index]->Variable.field_index);
  4047. GB_ASSERT(sel.index.count == 1);
  4048. GB_ASSERT(!sel.indirect);
  4049. index = sel.index[0];
  4050. }
  4051. field = st->fields[index];
  4052. Type *ft = field->type;
  4053. if (!is_raw_union && !is_type_typeid(ft) && lb_is_elem_const(elem, ft)) {
  4054. continue;
  4055. }
  4056. field_expr = lb_build_expr(p, elem);
  4057. lbValue gep = {};
  4058. if (is_raw_union) {
  4059. gep = lb_emit_conv(p, comp_lit_ptr, alloc_type_pointer(ft));
  4060. } else {
  4061. gep = lb_emit_struct_ep(p, comp_lit_ptr, cast(i32)index);
  4062. }
  4063. Type *fet = field_expr.type;
  4064. GB_ASSERT(fet->kind != Type_Tuple);
  4065. // HACK TODO(bill): THIS IS A MASSIVE HACK!!!!
  4066. if (is_type_union(ft) && !are_types_identical(fet, ft) && !is_type_untyped(fet)) {
  4067. GB_ASSERT_MSG(union_variant_index(ft, fet) >= 0, "%s", type_to_string(fet));
  4068. lb_emit_store_union_variant(p, gep, field_expr, fet);
  4069. } else {
  4070. lbValue fv = lb_emit_conv(p, field_expr, ft);
  4071. lb_emit_store(p, gep, fv);
  4072. }
  4073. }
  4074. }
  4075. break;
  4076. }
  4077. case Type_Map: {
  4078. if (cl->elems.count == 0) {
  4079. break;
  4080. }
  4081. GB_ASSERT(!build_context.no_dynamic_literals);
  4082. lbValue err = lb_dynamic_map_reserve(p, v.addr, 2*cl->elems.count, pos);
  4083. gb_unused(err);
  4084. for (Ast *elem : cl->elems) {
  4085. ast_node(fv, FieldValue, elem);
  4086. lbValue key = lb_build_expr(p, fv->field);
  4087. lbValue value = lb_build_expr(p, fv->value);
  4088. lb_internal_dynamic_map_set(p, v.addr, type, key, value, elem);
  4089. }
  4090. break;
  4091. }
  4092. case Type_Array: {
  4093. if (cl->elems.count > 0) {
  4094. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4095. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4096. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4097. lbValue dst_ptr = lb_addr_get_ptr(p, v);
  4098. for_array(i, temp_data) {
  4099. i32 index = cast(i32)(temp_data[i].elem_index);
  4100. temp_data[i].gep = lb_emit_array_epi(p, dst_ptr, index);
  4101. }
  4102. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4103. }
  4104. break;
  4105. }
  4106. case Type_EnumeratedArray: {
  4107. if (cl->elems.count > 0) {
  4108. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4109. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4110. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4111. lbValue dst_ptr = lb_addr_get_ptr(p, v);
  4112. i64 index_offset = exact_value_to_i64(*bt->EnumeratedArray.min_value);
  4113. for_array(i, temp_data) {
  4114. i32 index = cast(i32)(temp_data[i].elem_index - index_offset);
  4115. temp_data[i].gep = lb_emit_array_epi(p, dst_ptr, index);
  4116. }
  4117. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4118. }
  4119. break;
  4120. }
  4121. case Type_Slice: {
  4122. if (cl->elems.count > 0) {
  4123. lbValue slice = lb_const_value(p->module, type, exact_value_compound(expr));
  4124. lbValue data = lb_slice_elem(p, slice);
  4125. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4126. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4127. for_array(i, temp_data) {
  4128. temp_data[i].gep = lb_emit_ptr_offset(p, data, lb_const_int(p->module, t_int, temp_data[i].elem_index));
  4129. }
  4130. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4131. {
  4132. lbValue count = {};
  4133. count.type = t_int;
  4134. unsigned len_index = lb_convert_struct_index(p->module, type, 1);
  4135. if (lb_is_const(slice)) {
  4136. unsigned indices[1] = {len_index};
  4137. count.value = llvm_const_extract_value(p->module, slice.value, indices, gb_count_of(indices));
  4138. } else {
  4139. count.value = LLVMBuildExtractValue(p->builder, slice.value, len_index, "");
  4140. }
  4141. lb_fill_slice(p, v, data, count);
  4142. }
  4143. }
  4144. break;
  4145. }
  4146. case Type_DynamicArray: {
  4147. if (cl->elems.count == 0) {
  4148. break;
  4149. }
  4150. GB_ASSERT(!build_context.no_dynamic_literals);
  4151. Type *et = bt->DynamicArray.elem;
  4152. lbValue size = lb_const_int(p->module, t_int, type_size_of(et));
  4153. lbValue align = lb_const_int(p->module, t_int, type_align_of(et));
  4154. i64 item_count = gb_max(cl->max_count, cl->elems.count);
  4155. {
  4156. auto args = array_make<lbValue>(temporary_allocator(), 5);
  4157. args[0] = lb_emit_conv(p, lb_addr_get_ptr(p, v), t_rawptr);
  4158. args[1] = size;
  4159. args[2] = align;
  4160. args[3] = lb_const_int(p->module, t_int, item_count);
  4161. args[4] = lb_emit_source_code_location_as_global(p, proc_name, pos);
  4162. lb_emit_runtime_call(p, "__dynamic_array_reserve", args);
  4163. }
  4164. lbValue items = lb_generate_local_array(p, et, item_count);
  4165. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4166. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4167. for_array(i, temp_data) {
  4168. temp_data[i].gep = lb_emit_array_epi(p, items, temp_data[i].elem_index);
  4169. }
  4170. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4171. {
  4172. auto args = array_make<lbValue>(temporary_allocator(), 6);
  4173. args[0] = lb_emit_conv(p, v.addr, t_rawptr);
  4174. args[1] = size;
  4175. args[2] = align;
  4176. args[3] = lb_emit_conv(p, items, t_rawptr);
  4177. args[4] = lb_const_int(p->module, t_int, item_count);
  4178. args[5] = lb_emit_source_code_location_as_global(p, proc_name, pos);
  4179. lb_emit_runtime_call(p, "__dynamic_array_append", args);
  4180. }
  4181. break;
  4182. }
  4183. case Type_Basic: {
  4184. GB_ASSERT(is_type_any(bt));
  4185. if (cl->elems.count > 0) {
  4186. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4187. String field_names[2] = {
  4188. str_lit("data"),
  4189. str_lit("id"),
  4190. };
  4191. Type *field_types[2] = {
  4192. t_rawptr,
  4193. t_typeid,
  4194. };
  4195. for_array(field_index, cl->elems) {
  4196. Ast *elem = cl->elems[field_index];
  4197. lbValue field_expr = {};
  4198. isize index = field_index;
  4199. if (elem->kind == Ast_FieldValue) {
  4200. ast_node(fv, FieldValue, elem);
  4201. Selection sel = lookup_field(bt, fv->field->Ident.token.string, false);
  4202. index = sel.index[0];
  4203. elem = fv->value;
  4204. } else {
  4205. TypeAndValue tav = type_and_value_of_expr(elem);
  4206. Selection sel = lookup_field(bt, field_names[field_index], false);
  4207. index = sel.index[0];
  4208. }
  4209. field_expr = lb_build_expr(p, elem);
  4210. GB_ASSERT(field_expr.type->kind != Type_Tuple);
  4211. Type *ft = field_types[index];
  4212. lbValue fv = lb_emit_conv(p, field_expr, ft);
  4213. lbValue gep = lb_emit_struct_ep(p, lb_addr_get_ptr(p, v), cast(i32)index);
  4214. lb_emit_store(p, gep, fv);
  4215. }
  4216. }
  4217. break;
  4218. }
  4219. case Type_BitSet: {
  4220. i64 sz = type_size_of(type);
  4221. if (cl->elems.count > 0 && sz > 0) {
  4222. lbValue lower = lb_const_value(p->module, t_int, exact_value_i64(bt->BitSet.lower));
  4223. Type *backing = bit_set_to_int(type);
  4224. if (is_type_array(backing)) {
  4225. GB_PANIC("TODO: bit_set [N]T");
  4226. Type *base_it = core_array_type(backing);
  4227. i64 bits_per_elem = 8*type_size_of(base_it);
  4228. gb_unused(bits_per_elem);
  4229. lbValue one = lb_const_value(p->module, t_i64, exact_value_i64(1));
  4230. for (Ast *elem : cl->elems) {
  4231. GB_ASSERT(elem->kind != Ast_FieldValue);
  4232. lbValue expr = lb_build_expr(p, elem);
  4233. GB_ASSERT(expr.type->kind != Type_Tuple);
  4234. lbValue e = lb_emit_conv(p, expr, t_i64);
  4235. e = lb_emit_arith(p, Token_Sub, e, lower, t_i64);
  4236. // lbValue idx = lb_emit_arith(p, Token_Div, e, bits_per_elem, t_i64);
  4237. // lbValue val = lb_emit_arith(p, Token_Div, e, bits_per_elem, t_i64);
  4238. }
  4239. } else {
  4240. Type *it = bit_set_to_int(bt);
  4241. lbValue one = lb_const_value(p->module, it, exact_value_i64(1));
  4242. for (Ast *elem : cl->elems) {
  4243. GB_ASSERT(elem->kind != Ast_FieldValue);
  4244. lbValue expr = lb_build_expr(p, elem);
  4245. GB_ASSERT(expr.type->kind != Type_Tuple);
  4246. lbValue e = lb_emit_conv(p, expr, it);
  4247. e = lb_emit_arith(p, Token_Sub, e, lower, it);
  4248. e = lb_emit_arith(p, Token_Shl, one, e, it);
  4249. lbValue old_value = lb_emit_transmute(p, lb_addr_load(p, v), it);
  4250. lbValue new_value = lb_emit_arith(p, Token_Or, old_value, e, it);
  4251. new_value = lb_emit_transmute(p, new_value, type);
  4252. lb_addr_store(p, v, new_value);
  4253. }
  4254. }
  4255. }
  4256. break;
  4257. }
  4258. case Type_Matrix: {
  4259. if (cl->elems.count > 0) {
  4260. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4261. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4262. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4263. lbValue dst_ptr = lb_addr_get_ptr(p, v);
  4264. for_array(i, temp_data) {
  4265. temp_data[i].gep = lb_emit_array_epi(p, dst_ptr, temp_data[i].elem_index);
  4266. }
  4267. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4268. }
  4269. break;
  4270. }
  4271. case Type_SimdVector: {
  4272. if (cl->elems.count > 0) {
  4273. lbValue vector_value = lb_const_value(p->module, type, exact_value_compound(expr));
  4274. defer (lb_addr_store(p, v, vector_value));
  4275. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4276. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4277. // TODO(bill): reduce the need for individual `insertelement` if a `shufflevector`
  4278. // might be a better option
  4279. for (auto const &td : temp_data) {
  4280. if (td.value.value != nullptr) {
  4281. if (td.elem_length > 0) {
  4282. for (i64 k = 0; k < td.elem_length; k++) {
  4283. LLVMValueRef index = lb_const_int(p->module, t_u32, td.elem_index + k).value;
  4284. vector_value.value = LLVMBuildInsertElement(p->builder, vector_value.value, td.value.value, index, "");
  4285. }
  4286. } else {
  4287. LLVMValueRef index = lb_const_int(p->module, t_u32, td.elem_index).value;
  4288. vector_value.value = LLVMBuildInsertElement(p->builder, vector_value.value, td.value.value, index, "");
  4289. }
  4290. }
  4291. }
  4292. }
  4293. break;
  4294. }
  4295. }
  4296. return v;
  4297. }
  4298. gb_internal lbAddr lb_build_addr_internal(lbProcedure *p, Ast *expr) {
  4299. switch (expr->kind) {
  4300. case_ast_node(i, Implicit, expr);
  4301. lbAddr v = {};
  4302. switch (i->kind) {
  4303. case Token_context:
  4304. v = lb_find_or_generate_context_ptr(p);
  4305. break;
  4306. }
  4307. GB_ASSERT(v.addr.value != nullptr);
  4308. return v;
  4309. case_end;
  4310. case_ast_node(i, Ident, expr);
  4311. if (is_blank_ident(expr)) {
  4312. lbAddr val = {};
  4313. return val;
  4314. }
  4315. String name = i->token.string;
  4316. Entity *e = entity_of_node(expr);
  4317. return lb_build_addr_from_entity(p, e, expr);
  4318. case_end;
  4319. case_ast_node(se, SelectorExpr, expr);
  4320. Ast *sel_node = unparen_expr(se->selector);
  4321. if (sel_node->kind == Ast_Ident) {
  4322. String selector = sel_node->Ident.token.string;
  4323. TypeAndValue tav = type_and_value_of_expr(se->expr);
  4324. if (tav.mode == Addressing_Invalid) {
  4325. // NOTE(bill): Imports
  4326. Entity *imp = entity_of_node(se->expr);
  4327. if (imp != nullptr) {
  4328. GB_ASSERT(imp->kind == Entity_ImportName);
  4329. }
  4330. return lb_build_addr(p, unparen_expr(se->selector));
  4331. }
  4332. Type *type = base_type(tav.type);
  4333. if (tav.mode == Addressing_Type) { // Addressing_Type
  4334. Selection sel = lookup_field(tav.type, selector, true);
  4335. if (sel.pseudo_field) {
  4336. GB_ASSERT(sel.entity->kind == Entity_Procedure || sel.entity->kind == Entity_ProcGroup);
  4337. Entity *e = entity_of_node(sel_node);
  4338. GB_ASSERT(e->kind == Entity_Procedure);
  4339. return lb_addr(lb_find_value_from_entity(p->module, e));
  4340. }
  4341. GB_PANIC("Unreachable %.*s", LIT(selector));
  4342. }
  4343. if (se->swizzle_count > 0) {
  4344. Type *array_type = base_type(type_deref(tav.type));
  4345. GB_ASSERT(array_type->kind == Type_Array || array_type->kind == Type_SimdVector);
  4346. u8 swizzle_count = se->swizzle_count;
  4347. u8 swizzle_indices_raw = se->swizzle_indices;
  4348. u8 swizzle_indices[4] = {};
  4349. for (u8 i = 0; i < swizzle_count; i++) {
  4350. u8 index = swizzle_indices_raw>>(i*2) & 3;
  4351. swizzle_indices[i] = index;
  4352. }
  4353. lbValue a = {};
  4354. if (is_type_pointer(tav.type)) {
  4355. a = lb_build_expr(p, se->expr);
  4356. } else {
  4357. lbAddr addr = lb_build_addr(p, se->expr);
  4358. a = lb_addr_get_ptr(p, addr);
  4359. }
  4360. Type *type = type_deref(expr->tav.type);
  4361. GB_ASSERT(is_type_array(type) || is_type_simd_vector(type));
  4362. return lb_addr_swizzle(a, type, swizzle_count, swizzle_indices);
  4363. }
  4364. Selection sel = lookup_field(type, selector, false);
  4365. GB_ASSERT(sel.entity != nullptr);
  4366. if (sel.pseudo_field) {
  4367. GB_ASSERT(sel.entity->kind == Entity_Procedure || sel.entity->kind == Entity_ProcGroup);
  4368. Entity *e = entity_of_node(sel_node);
  4369. GB_ASSERT(e->kind == Entity_Procedure);
  4370. return lb_addr(lb_find_value_from_entity(p->module, e));
  4371. }
  4372. if (sel.is_bit_field) {
  4373. lbAddr addr = lb_build_addr(p, se->expr);
  4374. Selection sub_sel = sel;
  4375. sub_sel.index.count -= 1;
  4376. lbValue ptr = lb_addr_get_ptr(p, addr);
  4377. if (sub_sel.index.count > 0) {
  4378. ptr = lb_emit_deep_field_gep(p, ptr, sub_sel);
  4379. }
  4380. if (is_type_pointer(type_deref(ptr.type))) {
  4381. ptr = lb_emit_load(p, ptr);
  4382. }
  4383. Type *bf_type = type_deref(ptr.type);
  4384. bf_type = base_type(bf_type);
  4385. GB_ASSERT(bf_type->kind == Type_BitField);
  4386. i32 index = sel.index[sel.index.count-1];
  4387. Entity *f = bf_type->BitField.fields[index];
  4388. u8 bit_size = bf_type->BitField.bit_sizes[index];
  4389. i64 bit_offset = bf_type->BitField.bit_offsets[index];
  4390. return lb_addr_bit_field(ptr, f->type, bit_offset, bit_size);
  4391. }
  4392. {
  4393. lbAddr addr = lb_build_addr(p, se->expr);
  4394. if (addr.kind == lbAddr_Map) {
  4395. lbValue v = lb_addr_load(p, addr);
  4396. lbValue a = lb_address_from_load_or_generate_local(p, v);
  4397. a = lb_emit_deep_field_gep(p, a, sel);
  4398. return lb_addr(a);
  4399. } else if (addr.kind == lbAddr_Context) {
  4400. GB_ASSERT(sel.index.count > 0);
  4401. if (addr.ctx.sel.index.count >= 0) {
  4402. sel = selection_combine(addr.ctx.sel, sel);
  4403. }
  4404. addr.ctx.sel = sel;
  4405. addr.kind = lbAddr_Context;
  4406. return addr;
  4407. } else if (addr.kind == lbAddr_SoaVariable) {
  4408. lbValue index = addr.soa.index;
  4409. i32 first_index = sel.index[0];
  4410. Selection sub_sel = sel;
  4411. sub_sel.index.data += 1;
  4412. sub_sel.index.count -= 1;
  4413. lbValue arr = lb_emit_struct_ep(p, addr.addr, first_index);
  4414. Type *t = base_type(type_deref(addr.addr.type));
  4415. GB_ASSERT(is_type_soa_struct(t));
  4416. if (addr.soa.index_expr != nullptr && (!lb_is_const(addr.soa.index) || t->Struct.soa_kind != StructSoa_Fixed)) {
  4417. lbValue len = lb_soa_struct_len(p, addr.addr);
  4418. lb_emit_bounds_check(p, ast_token(addr.soa.index_expr), addr.soa.index, len);
  4419. }
  4420. lbValue item = {};
  4421. if (t->Struct.soa_kind == StructSoa_Fixed) {
  4422. item = lb_emit_array_ep(p, arr, index);
  4423. } else {
  4424. item = lb_emit_ptr_offset(p, lb_emit_load(p, arr), index);
  4425. }
  4426. if (sub_sel.index.count > 0) {
  4427. item = lb_emit_deep_field_gep(p, item, sub_sel);
  4428. }
  4429. // make sure it's ^T and not [^]T
  4430. item.type = alloc_type_multi_pointer_to_pointer(item.type);
  4431. return lb_addr(item);
  4432. } else if (addr.kind == lbAddr_Swizzle) {
  4433. GB_ASSERT(sel.index.count > 0);
  4434. // NOTE(bill): just patch the index in place
  4435. sel.index[0] = addr.swizzle.indices[sel.index[0]];
  4436. } else if (addr.kind == lbAddr_SwizzleLarge) {
  4437. GB_ASSERT(sel.index.count > 0);
  4438. // NOTE(bill): just patch the index in place
  4439. sel.index[0] = addr.swizzle.indices[sel.index[0]];
  4440. }
  4441. Type *atype = type_deref(lb_addr_type(addr));
  4442. if (is_type_soa_struct(atype)) {
  4443. map_set(&p->selector_addr, expr, addr);
  4444. }
  4445. lbValue a = lb_addr_get_ptr(p, addr);
  4446. a = lb_emit_deep_field_gep(p, a, sel);
  4447. return lb_addr(a);
  4448. }
  4449. } else {
  4450. GB_PANIC("Unsupported selector expression");
  4451. }
  4452. case_end;
  4453. case_ast_node(se, SelectorCallExpr, expr);
  4454. lbValue e = lb_build_expr(p, expr);
  4455. return lb_addr(lb_address_from_load_or_generate_local(p, e));
  4456. case_end;
  4457. case_ast_node(ta, TypeAssertion, expr);
  4458. TokenPos pos = ast_token(expr).pos;
  4459. lbValue e = lb_build_expr(p, ta->expr);
  4460. Type *t = type_deref(e.type);
  4461. if (is_type_union(t)) {
  4462. Type *type = type_of_expr(expr);
  4463. lbAddr v = lb_add_local_generated(p, type, false);
  4464. lb_addr_store(p, v, lb_emit_union_cast(p, lb_build_expr(p, ta->expr), type, pos));
  4465. return v;
  4466. } else if (is_type_any(t)) {
  4467. Type *type = type_of_expr(expr);
  4468. return lb_emit_any_cast_addr(p, lb_build_expr(p, ta->expr), type, pos);
  4469. } else {
  4470. GB_PANIC("TODO(bill): type assertion %s", type_to_string(e.type));
  4471. }
  4472. case_end;
  4473. case_ast_node(ue, UnaryExpr, expr);
  4474. switch (ue->op.kind) {
  4475. case Token_And: {
  4476. lbValue ptr = lb_build_expr(p, expr);
  4477. return lb_addr(lb_address_from_load_or_generate_local(p, ptr));
  4478. }
  4479. default:
  4480. GB_PANIC("Invalid unary expression for lb_build_addr");
  4481. }
  4482. case_end;
  4483. case_ast_node(be, BinaryExpr, expr);
  4484. lbValue v = lb_build_expr(p, expr);
  4485. Type *t = v.type;
  4486. if (is_type_pointer(t)) {
  4487. return lb_addr(v);
  4488. }
  4489. return lb_addr(lb_address_from_load_or_generate_local(p, v));
  4490. case_end;
  4491. case_ast_node(ie, IndexExpr, expr);
  4492. return lb_build_addr_index_expr(p, expr);
  4493. case_end;
  4494. case_ast_node(ie, MatrixIndexExpr, expr);
  4495. Type *t = base_type(type_of_expr(ie->expr));
  4496. bool deref = is_type_pointer(t);
  4497. t = base_type(type_deref(t));
  4498. lbValue m = {};
  4499. m = lb_build_addr_ptr(p, ie->expr);
  4500. if (deref) {
  4501. m = lb_emit_load(p, m);
  4502. }
  4503. lbValue row_index = lb_build_expr(p, ie->row_index);
  4504. lbValue column_index = lb_build_expr(p, ie->column_index);
  4505. row_index = lb_emit_conv(p, row_index, t_int);
  4506. column_index = lb_emit_conv(p, column_index, t_int);
  4507. lbValue elem = lb_emit_matrix_ep(p, m, row_index, column_index);
  4508. auto row_index_tv = type_and_value_of_expr(ie->row_index);
  4509. auto column_index_tv = type_and_value_of_expr(ie->column_index);
  4510. if (row_index_tv.mode != Addressing_Constant || column_index_tv.mode != Addressing_Constant) {
  4511. lbValue row_count = lb_const_int(p->module, t_int, t->Matrix.row_count);
  4512. lbValue column_count = lb_const_int(p->module, t_int, t->Matrix.column_count);
  4513. lb_emit_matrix_bounds_check(p, ast_token(ie->row_index), row_index, column_index, row_count, column_count);
  4514. }
  4515. return lb_addr(elem);
  4516. case_end;
  4517. case_ast_node(se, SliceExpr, expr);
  4518. return lb_build_addr_slice_expr(p, expr);
  4519. case_end;
  4520. case_ast_node(de, DerefExpr, expr);
  4521. Type *t = type_of_expr(de->expr);
  4522. if (is_type_relative_pointer(t)) {
  4523. lbAddr addr = lb_build_addr(p, de->expr);
  4524. addr.relative.deref = true;
  4525. return addr;
  4526. } else if (is_type_soa_pointer(t)) {
  4527. lbValue value = lb_build_expr(p, de->expr);
  4528. lbValue ptr = lb_emit_struct_ev(p, value, 0);
  4529. lbValue idx = lb_emit_struct_ev(p, value, 1);
  4530. return lb_addr_soa_variable(ptr, idx, nullptr);
  4531. }
  4532. lbValue addr = lb_build_expr(p, de->expr);
  4533. return lb_addr(addr);
  4534. case_end;
  4535. case_ast_node(ce, CallExpr, expr);
  4536. BuiltinProcId builtin_id = BuiltinProc_Invalid;
  4537. if (ce->proc->tav.mode == Addressing_Builtin) {
  4538. Entity *e = entity_of_node(ce->proc);
  4539. if (e != nullptr) {
  4540. builtin_id = cast(BuiltinProcId)e->Builtin.id;
  4541. } else {
  4542. builtin_id = BuiltinProc_DIRECTIVE;
  4543. }
  4544. }
  4545. auto const &tv = expr->tav;
  4546. if (builtin_id == BuiltinProc_swizzle &&
  4547. is_type_array(tv.type)) {
  4548. // NOTE(bill, 2021-08-09): `swizzle` has some bizarre semantics so it needs to be
  4549. // specialized here for to be addressable
  4550. return lb_build_array_swizzle_addr(p, ce, tv);
  4551. }
  4552. // NOTE(bill): This is make sure you never need to have an 'array_ev'
  4553. lbValue e = lb_build_expr(p, expr);
  4554. #if 1
  4555. return lb_addr(lb_address_from_load_or_generate_local(p, e));
  4556. #else
  4557. lbAddr v = lb_add_local_generated(p, e.type, false);
  4558. lb_addr_store(p, v, e);
  4559. return v;
  4560. #endif
  4561. case_end;
  4562. case_ast_node(cl, CompoundLit, expr);
  4563. return lb_build_addr_compound_lit(p, expr);
  4564. case_end;
  4565. case_ast_node(tc, TypeCast, expr);
  4566. Type *type = type_of_expr(expr);
  4567. lbValue x = lb_build_expr(p, tc->expr);
  4568. lbValue e = {};
  4569. switch (tc->token.kind) {
  4570. case Token_cast:
  4571. e = lb_emit_conv(p, x, type);
  4572. break;
  4573. case Token_transmute:
  4574. e = lb_emit_transmute(p, x, type);
  4575. break;
  4576. default:
  4577. GB_PANIC("Invalid AST TypeCast");
  4578. }
  4579. lbAddr v = lb_add_local_generated(p, type, false);
  4580. lb_addr_store(p, v, e);
  4581. return v;
  4582. case_end;
  4583. case_ast_node(ac, AutoCast, expr);
  4584. return lb_build_addr(p, ac->expr);
  4585. case_end;
  4586. case_ast_node(te, TernaryIfExpr, expr);
  4587. LLVMValueRef incoming_values[2] = {};
  4588. LLVMBasicBlockRef incoming_blocks[2] = {};
  4589. GB_ASSERT(te->y != nullptr);
  4590. lbBlock *then = lb_create_block(p, "if.then");
  4591. lbBlock *done = lb_create_block(p, "if.done"); // NOTE(bill): Append later
  4592. lbBlock *else_ = lb_create_block(p, "if.else");
  4593. lb_build_cond(p, te->cond, then, else_);
  4594. lb_start_block(p, then);
  4595. Type *ptr_type = alloc_type_pointer(default_type(type_of_expr(expr)));
  4596. incoming_values[0] = lb_emit_conv(p, lb_build_addr_ptr(p, te->x), ptr_type).value;
  4597. lb_emit_jump(p, done);
  4598. lb_start_block(p, else_);
  4599. incoming_values[1] = lb_emit_conv(p, lb_build_addr_ptr(p, te->y), ptr_type).value;
  4600. lb_emit_jump(p, done);
  4601. lb_start_block(p, done);
  4602. lbValue res = {};
  4603. res.value = LLVMBuildPhi(p->builder, lb_type(p->module, ptr_type), "");
  4604. res.type = ptr_type;
  4605. GB_ASSERT(p->curr_block->preds.count >= 2);
  4606. incoming_blocks[0] = p->curr_block->preds[0]->block;
  4607. incoming_blocks[1] = p->curr_block->preds[1]->block;
  4608. LLVMAddIncoming(res.value, incoming_values, incoming_blocks, 2);
  4609. return lb_addr(res);
  4610. case_end;
  4611. case_ast_node(oe, OrElseExpr, expr);
  4612. lbValue ptr = lb_address_from_load_or_generate_local(p, lb_build_expr(p, expr));
  4613. return lb_addr(ptr);
  4614. case_end;
  4615. case_ast_node(oe, OrReturnExpr, expr);
  4616. lbValue ptr = lb_address_from_load_or_generate_local(p, lb_build_expr(p, expr));
  4617. return lb_addr(ptr);
  4618. case_end;
  4619. case_ast_node(be, OrBranchExpr, expr);
  4620. lbBlock *block = nullptr;
  4621. if (be->label != nullptr) {
  4622. lbBranchBlocks bb = lb_lookup_branch_blocks(p, be->label);
  4623. switch (be->token.kind) {
  4624. case Token_or_break: block = bb.break_; break;
  4625. case Token_or_continue: block = bb.continue_; break;
  4626. }
  4627. } else {
  4628. for (lbTargetList *t = p->target_list; t != nullptr && block == nullptr; t = t->prev) {
  4629. if (t->is_block) {
  4630. continue;
  4631. }
  4632. switch (be->token.kind) {
  4633. case Token_or_break: block = t->break_; break;
  4634. case Token_or_continue: block = t->continue_; break;
  4635. }
  4636. }
  4637. }
  4638. GB_ASSERT(block != nullptr);
  4639. TypeAndValue tv = expr->tav;
  4640. lbValue lhs = {};
  4641. lbValue rhs = {};
  4642. lb_emit_try_lhs_rhs(p, be->expr, tv, &lhs, &rhs);
  4643. Type *type = default_type(tv.type);
  4644. if (lhs.value) {
  4645. lhs = lb_emit_conv(p, lhs, type);
  4646. } else if (type != nullptr && type != t_invalid) {
  4647. lhs = lb_const_nil(p->module, type);
  4648. }
  4649. lbBlock *then = lb_create_block(p, "or_branch.then");
  4650. lbBlock *else_ = lb_create_block(p, "or_branch.else");
  4651. lb_emit_if(p, lb_emit_try_has_value(p, rhs), then, else_);
  4652. lb_start_block(p, else_);
  4653. lb_emit_defer_stmts(p, lbDeferExit_Branch, block);
  4654. lb_emit_jump(p, block);
  4655. lb_start_block(p, then);
  4656. return lb_addr(lb_address_from_load_or_generate_local(p, lhs));
  4657. case_end;
  4658. }
  4659. TokenPos token_pos = ast_token(expr).pos;
  4660. GB_PANIC("Unexpected address expression\n"
  4661. "\tAst: %.*s @ "
  4662. "%s\n",
  4663. LIT(ast_strings[expr->kind]),
  4664. token_pos_to_string(token_pos));
  4665. return {};
  4666. }