cgcpu.pas 219 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152215321542155215621572158215921602161216221632164216521662167216821692170217121722173217421752176217721782179218021812182218321842185218621872188218921902191219221932194219521962197219821992200220122022203220422052206220722082209221022112212221322142215221622172218221922202221222222232224222522262227222822292230223122322233223422352236223722382239224022412242224322442245224622472248224922502251225222532254225522562257225822592260226122622263226422652266226722682269227022712272227322742275227622772278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277727782779278027812782278327842785278627872788278927902791279227932794279527962797279827992800280128022803280428052806280728082809281028112812281328142815281628172818281928202821282228232824282528262827282828292830283128322833283428352836283728382839284028412842284328442845284628472848284928502851285228532854285528562857285828592860286128622863286428652866286728682869287028712872287328742875287628772878287928802881288228832884288528862887288828892890289128922893289428952896289728982899290029012902290329042905290629072908290929102911291229132914291529162917291829192920292129222923292429252926292729282929293029312932293329342935293629372938293929402941294229432944294529462947294829492950295129522953295429552956295729582959296029612962296329642965296629672968296929702971297229732974297529762977297829792980298129822983298429852986298729882989299029912992299329942995299629972998299930003001300230033004300530063007300830093010301130123013301430153016301730183019302030213022302330243025302630273028302930303031303230333034303530363037303830393040304130423043304430453046304730483049305030513052305330543055305630573058305930603061306230633064306530663067306830693070307130723073307430753076307730783079308030813082308330843085308630873088308930903091309230933094309530963097309830993100310131023103310431053106310731083109311031113112311331143115311631173118311931203121312231233124312531263127312831293130313131323133313431353136313731383139314031413142314331443145314631473148314931503151315231533154315531563157315831593160316131623163316431653166316731683169317031713172317331743175317631773178317931803181318231833184318531863187318831893190319131923193319431953196319731983199320032013202320332043205320632073208320932103211321232133214321532163217321832193220322132223223322432253226322732283229323032313232323332343235323632373238323932403241324232433244324532463247324832493250325132523253325432553256325732583259326032613262326332643265326632673268326932703271327232733274327532763277327832793280328132823283328432853286328732883289329032913292329332943295329632973298329933003301330233033304330533063307330833093310331133123313331433153316331733183319332033213322332333243325332633273328332933303331333233333334333533363337333833393340334133423343334433453346334733483349335033513352335333543355335633573358335933603361336233633364336533663367336833693370337133723373337433753376337733783379338033813382338333843385338633873388338933903391339233933394339533963397339833993400340134023403340434053406340734083409341034113412341334143415341634173418341934203421342234233424342534263427342834293430343134323433343434353436343734383439344034413442344334443445344634473448344934503451345234533454345534563457345834593460346134623463346434653466346734683469347034713472347334743475347634773478347934803481348234833484348534863487348834893490349134923493349434953496349734983499350035013502350335043505350635073508350935103511351235133514351535163517351835193520352135223523352435253526352735283529353035313532353335343535353635373538353935403541354235433544354535463547354835493550355135523553355435553556355735583559356035613562356335643565356635673568356935703571357235733574357535763577357835793580358135823583358435853586358735883589359035913592359335943595359635973598359936003601360236033604360536063607360836093610361136123613361436153616361736183619362036213622362336243625362636273628362936303631363236333634363536363637363836393640364136423643364436453646364736483649365036513652365336543655365636573658365936603661366236633664366536663667366836693670367136723673367436753676367736783679368036813682368336843685368636873688368936903691369236933694369536963697369836993700370137023703370437053706370737083709371037113712371337143715371637173718371937203721372237233724372537263727372837293730373137323733373437353736373737383739374037413742374337443745374637473748374937503751375237533754375537563757375837593760376137623763376437653766376737683769377037713772377337743775377637773778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427742784279428042814282428342844285428642874288428942904291429242934294429542964297429842994300430143024303430443054306430743084309431043114312431343144315431643174318431943204321432243234324432543264327432843294330433143324333433443354336433743384339434043414342434343444345434643474348434943504351435243534354435543564357435843594360436143624363436443654366436743684369437043714372437343744375437643774378437943804381438243834384438543864387438843894390439143924393439443954396439743984399440044014402440344044405440644074408440944104411441244134414441544164417441844194420442144224423442444254426442744284429443044314432443344344435443644374438443944404441444244434444444544464447444844494450445144524453445444554456445744584459446044614462446344644465446644674468446944704471447244734474447544764477447844794480448144824483448444854486448744884489449044914492449344944495449644974498449945004501450245034504450545064507450845094510451145124513451445154516451745184519452045214522452345244525452645274528452945304531453245334534453545364537453845394540454145424543454445454546454745484549455045514552455345544555455645574558455945604561456245634564456545664567456845694570457145724573457445754576457745784579458045814582458345844585458645874588458945904591459245934594459545964597459845994600460146024603460446054606460746084609461046114612461346144615461646174618461946204621462246234624462546264627462846294630463146324633463446354636463746384639464046414642464346444645464646474648464946504651465246534654465546564657465846594660466146624663466446654666466746684669467046714672467346744675467646774678467946804681468246834684468546864687468846894690469146924693469446954696469746984699470047014702470347044705470647074708470947104711471247134714471547164717471847194720472147224723472447254726472747284729473047314732473347344735473647374738473947404741474247434744474547464747474847494750475147524753475447554756475747584759476047614762476347644765476647674768476947704771477247734774477547764777477847794780478147824783478447854786478747884789479047914792479347944795479647974798479948004801480248034804480548064807480848094810481148124813481448154816481748184819482048214822482348244825482648274828482948304831483248334834483548364837483848394840484148424843484448454846484748484849485048514852485348544855485648574858485948604861486248634864486548664867486848694870487148724873487448754876487748784879488048814882488348844885488648874888488948904891489248934894489548964897489848994900490149024903490449054906490749084909491049114912491349144915491649174918491949204921492249234924492549264927492849294930493149324933493449354936493749384939494049414942494349444945494649474948494949504951495249534954495549564957495849594960496149624963496449654966496749684969497049714972497349744975497649774978497949804981498249834984498549864987498849894990499149924993499449954996499749984999500050015002500350045005500650075008500950105011501250135014501550165017501850195020502150225023502450255026502750285029503050315032503350345035503650375038503950405041504250435044504550465047504850495050505150525053505450555056505750585059506050615062506350645065506650675068506950705071507250735074507550765077507850795080508150825083508450855086508750885089509050915092509350945095509650975098509951005101510251035104510551065107510851095110511151125113511451155116511751185119512051215122512351245125512651275128512951305131513251335134513551365137513851395140514151425143514451455146514751485149515051515152515351545155515651575158515951605161516251635164516551665167516851695170517151725173517451755176517751785179518051815182518351845185518651875188518951905191519251935194519551965197519851995200520152025203520452055206520752085209521052115212521352145215521652175218521952205221522252235224522552265227522852295230523152325233523452355236523752385239524052415242524352445245524652475248524952505251525252535254525552565257525852595260526152625263526452655266526752685269527052715272527352745275527652775278527952805281528252835284528552865287528852895290529152925293529452955296529752985299530053015302530353045305530653075308530953105311531253135314531553165317531853195320532153225323532453255326532753285329533053315332533353345335533653375338533953405341534253435344534553465347534853495350535153525353535453555356535753585359536053615362536353645365536653675368536953705371537253735374537553765377537853795380538153825383538453855386538753885389539053915392539353945395539653975398539954005401540254035404540554065407540854095410541154125413541454155416541754185419542054215422542354245425542654275428542954305431543254335434543554365437543854395440544154425443544454455446544754485449545054515452545354545455545654575458
  1. {
  2. Copyright (c) 2003 by Florian Klaempfl
  3. Member of the Free Pascal development team
  4. This unit implements the code generator for the ARM
  5. This program is free software; you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation; either version 2 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program; if not, write to the Free Software
  15. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  16. ****************************************************************************
  17. }
  18. unit cgcpu;
  19. {$i fpcdefs.inc}
  20. interface
  21. uses
  22. globtype,symtype,symdef,
  23. cgbase,cgutils,cgobj,
  24. aasmbase,aasmcpu,aasmtai,aasmdata,
  25. parabase,
  26. cpubase,cpuinfo,cg64f32,rgcpu;
  27. type
  28. { tbasecgarm is shared between all arm architectures }
  29. tbasecgarm = class(tcg)
  30. { true, if the next arithmetic operation should modify the flags }
  31. cgsetflags : boolean;
  32. procedure a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);override;
  33. procedure a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);override;
  34. procedure a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);override;
  35. procedure a_call_name(list : TAsmList;const s : string; weak: boolean);override;
  36. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  37. { move instructions }
  38. procedure a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);override;
  39. procedure a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);override;
  40. function a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  41. function a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  42. { fpu move instructions }
  43. procedure a_loadfpu_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister); override;
  44. procedure a_loadfpu_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister); override;
  45. procedure a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference); override;
  46. procedure a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);override;
  47. { comparison operations }
  48. procedure a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  49. l : tasmlabel);override;
  50. procedure a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel); override;
  51. procedure a_jmp_name(list : TAsmList;const s : string); override;
  52. procedure a_jmp_always(list : TAsmList;l: tasmlabel); override;
  53. procedure a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel); override;
  54. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  55. procedure g_profilecode(list : TAsmList); override;
  56. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  57. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  58. procedure g_maybe_got_init(list : TAsmList); override;
  59. procedure a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);override;
  60. procedure g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);override;
  61. procedure g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);override;
  62. procedure g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  63. procedure g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  64. procedure g_overflowcheck(list: TAsmList; const l: tlocation; def: tdef); override;
  65. procedure g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);override;
  66. procedure g_save_registers(list : TAsmList);override;
  67. procedure g_restore_registers(list : TAsmList);override;
  68. procedure a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  69. procedure fixref(list : TAsmList;var ref : treference);
  70. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; virtual;
  71. procedure g_intf_wrapper(list: TAsmList; procdef: tprocdef; const labelname: string; ioffset: longint);override;
  72. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  73. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  74. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  75. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  76. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  77. procedure a_opmm_reg_reg(list: TAsmList; Op: TOpCG; size : tcgsize;src,dst: tregister;shuffle : pmmshuffle); override;
  78. { Transform unsupported methods into Internal errors }
  79. procedure a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister); override;
  80. { try to generate optimized 32 Bit multiplication, returns true if successful generated }
  81. function try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  82. { clear out potential overflow bits from 8 or 16 bit operations }
  83. { the upper 24/16 bits of a register after an operation }
  84. procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  85. { mla for thumb requires that none of the registers is equal to r13/r15, this method ensures this }
  86. procedure safe_mla(list: TAsmList;op1,op2,op3,op4 : TRegister);
  87. end;
  88. { tcgarm is shared between normal arm and thumb-2 }
  89. tcgarm = class(tbasecgarm)
  90. procedure a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister); override;
  91. procedure a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference); override;
  92. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  93. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  94. size: tcgsize; a: tcgint; src, dst: tregister); override;
  95. procedure a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  96. size: tcgsize; src1, src2, dst: tregister); override;
  97. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  98. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  99. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  100. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  101. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  102. {Multiply two 32-bit registers into lo and hi 32-bit registers}
  103. procedure a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister); override;
  104. end;
  105. { normal arm cg }
  106. tarmcgarm = class(tcgarm)
  107. procedure init_register_allocators;override;
  108. procedure done_register_allocators;override;
  109. end;
  110. { 64 bit cg for all arm flavours }
  111. tbasecg64farm = class(tcg64f32)
  112. end;
  113. { tcg64farm is shared between normal arm and thumb-2 }
  114. tcg64farm = class(tbasecg64farm)
  115. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  116. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  117. procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;
  118. procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
  119. procedure a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  120. procedure a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  121. procedure a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);override;
  122. procedure a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);override;
  123. end;
  124. tarmcg64farm = class(tcg64farm)
  125. end;
  126. tthumbcgarm = class(tbasecgarm)
  127. procedure init_register_allocators;override;
  128. procedure done_register_allocators;override;
  129. procedure g_proc_entry(list: TAsmList; localsize: longint; nostackframe: boolean);override;
  130. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  131. procedure a_op_reg_reg(list: TAsmList; Op: TOpCG; size: TCGSize; src,dst: TRegister);override;
  132. procedure a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);override;
  133. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister); override;
  134. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  135. procedure a_load_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const Ref: treference; reg: tregister);override;
  136. procedure a_load_const_reg(list: TAsmList; size: tcgsize; a: tcgint; reg: tregister);override;
  137. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  138. function handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference; override;
  139. procedure g_external_wrapper(list : TAsmList; procdef : tprocdef; const externalname : string); override;
  140. end;
  141. tthumbcg64farm = class(tbasecg64farm)
  142. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  143. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  144. end;
  145. tthumb2cgarm = class(tcgarm)
  146. procedure init_register_allocators;override;
  147. procedure done_register_allocators;override;
  148. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  149. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  150. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  151. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  152. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  153. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  154. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  155. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  156. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  157. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; override;
  158. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  159. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  160. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  161. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  162. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  163. end;
  164. tthumb2cg64farm = class(tcg64farm)
  165. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  166. end;
  167. const
  168. OpCmp2AsmCond : Array[topcmp] of TAsmCond = (C_NONE,C_EQ,C_GT,
  169. C_LT,C_GE,C_LE,C_NE,C_LS,C_CC,C_CS,C_HI);
  170. winstackpagesize = 4096;
  171. function get_fpu_postfix(def : tdef) : toppostfix;
  172. procedure create_codegen;
  173. implementation
  174. uses
  175. globals,verbose,systems,cutils,
  176. aopt,aoptcpu,
  177. fmodule,
  178. symconst,symsym,symtable,
  179. tgobj,
  180. procinfo,cpupi,
  181. paramgr;
  182. function get_fpu_postfix(def : tdef) : toppostfix;
  183. begin
  184. if def.typ=floatdef then
  185. begin
  186. case tfloatdef(def).floattype of
  187. s32real:
  188. result:=PF_S;
  189. s64real:
  190. result:=PF_D;
  191. s80real:
  192. result:=PF_E;
  193. else
  194. internalerror(200401272);
  195. end;
  196. end
  197. else
  198. internalerror(200401271);
  199. end;
  200. procedure tarmcgarm.init_register_allocators;
  201. begin
  202. inherited init_register_allocators;
  203. { currently, we always save R14, so we can use it }
  204. if (target_info.system<>system_arm_darwin) then
  205. begin
  206. if assigned(current_procinfo) and (current_procinfo.framepointer<>NR_R11) then
  207. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  208. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  209. RS_R9,RS_R10,RS_R11,RS_R14],first_int_imreg,[])
  210. else
  211. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  212. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  213. RS_R9,RS_R10,RS_R14],first_int_imreg,[])
  214. end
  215. else
  216. { r7 is not available on Darwin, it's used as frame pointer (always,
  217. for backtrace support -- also in gcc/clang -> R11 can be used).
  218. r9 is volatile }
  219. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  220. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R9,RS_R12,RS_R4,RS_R5,RS_R6,RS_R8,
  221. RS_R10,RS_R11,RS_R14],first_int_imreg,[]);
  222. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  223. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  224. { The register allocator currently cannot deal with multiple
  225. non-overlapping subregs per register, so we can only use
  226. half the single precision registers for now (as sub registers of the
  227. double precision ones). }
  228. if current_settings.fputype=fpu_vfpv3 then
  229. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  230. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  231. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  232. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  233. ],first_mm_imreg,[])
  234. else
  235. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  236. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15],first_mm_imreg,[]);
  237. end;
  238. procedure tarmcgarm.done_register_allocators;
  239. begin
  240. rg[R_INTREGISTER].free;
  241. rg[R_FPUREGISTER].free;
  242. rg[R_MMREGISTER].free;
  243. inherited done_register_allocators;
  244. end;
  245. procedure tcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  246. var
  247. imm_shift : byte;
  248. l : tasmlabel;
  249. hr : treference;
  250. imm1, imm2: DWord;
  251. begin
  252. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  253. internalerror(2002090902);
  254. if is_shifter_const(a,imm_shift) then
  255. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  256. else if is_shifter_const(not(a),imm_shift) then
  257. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  258. { loading of constants with mov and orr }
  259. else if (split_into_shifter_const(a,imm1, imm2)) then
  260. begin
  261. list.concat(taicpu.op_reg_const(A_MOV,reg, imm1));
  262. list.concat(taicpu.op_reg_reg_const(A_ORR,reg,reg, imm2));
  263. end
  264. { loading of constants with mvn and bic }
  265. else if (split_into_shifter_const(not(a), imm1, imm2)) then
  266. begin
  267. list.concat(taicpu.op_reg_const(A_MVN,reg, imm1));
  268. list.concat(taicpu.op_reg_reg_const(A_BIC,reg,reg, imm2));
  269. end
  270. else
  271. begin
  272. reference_reset(hr,4);
  273. current_asmdata.getjumplabel(l);
  274. cg.a_label(current_procinfo.aktlocaldata,l);
  275. hr.symboldata:=current_procinfo.aktlocaldata.last;
  276. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  277. hr.symbol:=l;
  278. hr.base:=NR_PC;
  279. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  280. end;
  281. end;
  282. procedure tcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  283. var
  284. oppostfix:toppostfix;
  285. usedtmpref: treference;
  286. tmpreg,tmpreg2 : tregister;
  287. so : tshifterop;
  288. dir : integer;
  289. begin
  290. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  291. FromSize := ToSize;
  292. case FromSize of
  293. { signed integer registers }
  294. OS_8:
  295. oppostfix:=PF_B;
  296. OS_S8:
  297. oppostfix:=PF_SB;
  298. OS_16:
  299. oppostfix:=PF_H;
  300. OS_S16:
  301. oppostfix:=PF_SH;
  302. OS_32,
  303. OS_S32:
  304. oppostfix:=PF_None;
  305. else
  306. InternalError(200308297);
  307. end;
  308. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  309. begin
  310. if target_info.endian=endian_big then
  311. dir:=-1
  312. else
  313. dir:=1;
  314. case FromSize of
  315. OS_16,OS_S16:
  316. begin
  317. { only complicated references need an extra loadaddr }
  318. if assigned(ref.symbol) or
  319. (ref.index<>NR_NO) or
  320. (ref.offset<-4095) or
  321. (ref.offset>4094) or
  322. { sometimes the compiler reused registers }
  323. (reg=ref.index) or
  324. (reg=ref.base) then
  325. begin
  326. tmpreg2:=getintregister(list,OS_INT);
  327. a_loadaddr_ref_reg(list,ref,tmpreg2);
  328. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  329. end
  330. else
  331. usedtmpref:=ref;
  332. if target_info.endian=endian_big then
  333. inc(usedtmpref.offset,1);
  334. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  335. tmpreg:=getintregister(list,OS_INT);
  336. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  337. inc(usedtmpref.offset,dir);
  338. if FromSize=OS_16 then
  339. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  340. else
  341. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  342. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  343. end;
  344. OS_32,OS_S32:
  345. begin
  346. tmpreg:=getintregister(list,OS_INT);
  347. { only complicated references need an extra loadaddr }
  348. if assigned(ref.symbol) or
  349. (ref.index<>NR_NO) or
  350. (ref.offset<-4095) or
  351. (ref.offset>4092) or
  352. { sometimes the compiler reused registers }
  353. (reg=ref.index) or
  354. (reg=ref.base) then
  355. begin
  356. tmpreg2:=getintregister(list,OS_INT);
  357. a_loadaddr_ref_reg(list,ref,tmpreg2);
  358. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  359. end
  360. else
  361. usedtmpref:=ref;
  362. shifterop_reset(so);so.shiftmode:=SM_LSL;
  363. if ref.alignment=2 then
  364. begin
  365. if target_info.endian=endian_big then
  366. inc(usedtmpref.offset,2);
  367. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  368. inc(usedtmpref.offset,dir*2);
  369. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  370. so.shiftimm:=16;
  371. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  372. end
  373. else
  374. begin
  375. tmpreg2:=getintregister(list,OS_INT);
  376. if target_info.endian=endian_big then
  377. inc(usedtmpref.offset,3);
  378. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  379. inc(usedtmpref.offset,dir);
  380. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  381. inc(usedtmpref.offset,dir);
  382. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg2);
  383. so.shiftimm:=8;
  384. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  385. inc(usedtmpref.offset,dir);
  386. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  387. so.shiftimm:=16;
  388. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg2,so));
  389. so.shiftimm:=24;
  390. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  391. end;
  392. end
  393. else
  394. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  395. end;
  396. end
  397. else
  398. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  399. if (fromsize=OS_S8) and (tosize = OS_16) then
  400. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  401. end;
  402. procedure tcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  403. var
  404. hsym : tsym;
  405. href : treference;
  406. paraloc : Pcgparalocation;
  407. shift : byte;
  408. begin
  409. { calculate the parameter info for the procdef }
  410. procdef.init_paraloc_info(callerside);
  411. hsym:=tsym(procdef.parast.Find('self'));
  412. if not(assigned(hsym) and
  413. (hsym.typ=paravarsym)) then
  414. internalerror(200305251);
  415. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  416. while paraloc<>nil do
  417. with paraloc^ do
  418. begin
  419. case loc of
  420. LOC_REGISTER:
  421. begin
  422. if is_shifter_const(ioffset,shift) then
  423. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  424. else
  425. begin
  426. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  427. a_op_reg_reg(list,OP_SUB,size,NR_R12,register);
  428. end;
  429. end;
  430. LOC_REFERENCE:
  431. begin
  432. { offset in the wrapper needs to be adjusted for the stored
  433. return address }
  434. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),sizeof(pint));
  435. if is_shifter_const(ioffset,shift) then
  436. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  437. else
  438. begin
  439. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  440. a_op_reg_ref(list,OP_SUB,size,NR_R12,href);
  441. end;
  442. end
  443. else
  444. internalerror(200309189);
  445. end;
  446. paraloc:=next;
  447. end;
  448. end;
  449. procedure tbasecgarm.a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);
  450. var
  451. ref: treference;
  452. begin
  453. paraloc.check_simple_location;
  454. paramanager.allocparaloc(list,paraloc.location);
  455. case paraloc.location^.loc of
  456. LOC_REGISTER,LOC_CREGISTER:
  457. a_load_const_reg(list,size,a,paraloc.location^.register);
  458. LOC_REFERENCE:
  459. begin
  460. reference_reset(ref,paraloc.alignment);
  461. ref.base:=paraloc.location^.reference.index;
  462. ref.offset:=paraloc.location^.reference.offset;
  463. a_load_const_ref(list,size,a,ref);
  464. end;
  465. else
  466. internalerror(2002081101);
  467. end;
  468. end;
  469. procedure tbasecgarm.a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);
  470. var
  471. tmpref, ref: treference;
  472. location: pcgparalocation;
  473. sizeleft: aint;
  474. begin
  475. location := paraloc.location;
  476. tmpref := r;
  477. sizeleft := paraloc.intsize;
  478. while assigned(location) do
  479. begin
  480. paramanager.allocparaloc(list,location);
  481. case location^.loc of
  482. LOC_REGISTER,LOC_CREGISTER:
  483. a_load_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  484. LOC_REFERENCE:
  485. begin
  486. reference_reset_base(ref,location^.reference.index,location^.reference.offset,paraloc.alignment);
  487. { doubles in softemu mode have a strange order of registers and references }
  488. if location^.size=OS_32 then
  489. g_concatcopy(list,tmpref,ref,4)
  490. else
  491. begin
  492. g_concatcopy(list,tmpref,ref,sizeleft);
  493. if assigned(location^.next) then
  494. internalerror(2005010710);
  495. end;
  496. end;
  497. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  498. case location^.size of
  499. OS_F32, OS_F64:
  500. a_loadfpu_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  501. else
  502. internalerror(2002072801);
  503. end;
  504. LOC_VOID:
  505. begin
  506. // nothing to do
  507. end;
  508. else
  509. internalerror(2002081103);
  510. end;
  511. inc(tmpref.offset,tcgsize2size[location^.size]);
  512. dec(sizeleft,tcgsize2size[location^.size]);
  513. location := location^.next;
  514. end;
  515. end;
  516. procedure tbasecgarm.a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);
  517. var
  518. ref: treference;
  519. tmpreg: tregister;
  520. begin
  521. paraloc.check_simple_location;
  522. paramanager.allocparaloc(list,paraloc.location);
  523. case paraloc.location^.loc of
  524. LOC_REGISTER,LOC_CREGISTER:
  525. a_loadaddr_ref_reg(list,r,paraloc.location^.register);
  526. LOC_REFERENCE:
  527. begin
  528. reference_reset(ref,paraloc.alignment);
  529. ref.base := paraloc.location^.reference.index;
  530. ref.offset := paraloc.location^.reference.offset;
  531. tmpreg := getintregister(list,OS_ADDR);
  532. a_loadaddr_ref_reg(list,r,tmpreg);
  533. a_load_reg_ref(list,OS_ADDR,OS_ADDR,tmpreg,ref);
  534. end;
  535. else
  536. internalerror(2002080701);
  537. end;
  538. end;
  539. procedure tbasecgarm.a_call_name(list : TAsmList;const s : string; weak: boolean);
  540. var
  541. branchopcode: tasmop;
  542. r : treference;
  543. sym : TAsmSymbol;
  544. begin
  545. { check not really correct: should only be used for non-Thumb cpus }
  546. if CPUARM_HAS_BLX_LABEL in cpu_capabilities[current_settings.cputype] then
  547. branchopcode:=A_BLX
  548. else
  549. branchopcode:=A_BL;
  550. if not(weak) then
  551. sym:=current_asmdata.RefAsmSymbol(s)
  552. else
  553. sym:=current_asmdata.WeakRefAsmSymbol(s);
  554. reference_reset_symbol(r,sym,0,sizeof(pint));
  555. if (tf_pic_uses_got in target_info.flags) and
  556. (cs_create_pic in current_settings.moduleswitches) then
  557. begin
  558. r.refaddr:=addr_pic
  559. end
  560. else
  561. r.refaddr:=addr_full;
  562. list.concat(taicpu.op_ref(branchopcode,r));
  563. {
  564. the compiler does not properly set this flag anymore in pass 1, and
  565. for now we only need it after pass 2 (I hope) (JM)
  566. if not(pi_do_call in current_procinfo.flags) then
  567. internalerror(2003060703);
  568. }
  569. include(current_procinfo.flags,pi_do_call);
  570. end;
  571. procedure tbasecgarm.a_call_reg(list : TAsmList;reg: tregister);
  572. begin
  573. { check not really correct: should only be used for non-Thumb cpus }
  574. if not(CPUARM_HAS_BLX in cpu_capabilities[current_settings.cputype]) then
  575. begin
  576. list.concat(taicpu.op_reg_reg(A_MOV,NR_R14,NR_PC));
  577. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,reg));
  578. end
  579. else
  580. list.concat(taicpu.op_reg(A_BLX, reg));
  581. {
  582. the compiler does not properly set this flag anymore in pass 1, and
  583. for now we only need it after pass 2 (I hope) (JM)
  584. if not(pi_do_call in current_procinfo.flags) then
  585. internalerror(2003060703);
  586. }
  587. include(current_procinfo.flags,pi_do_call);
  588. end;
  589. procedure tcgarm.a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister);
  590. begin
  591. a_op_const_reg_reg(list,op,size,a,reg,reg);
  592. end;
  593. procedure tcgarm.a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference);
  594. var
  595. tmpreg,tmpresreg : tregister;
  596. tmpref : treference;
  597. begin
  598. tmpreg:=getintregister(list,size);
  599. tmpresreg:=getintregister(list,size);
  600. tmpref:=a_internal_load_ref_reg(list,size,size,ref,tmpreg);
  601. a_op_const_reg_reg(list,op,size,a,tmpreg,tmpresreg);
  602. a_load_reg_ref(list,size,size,tmpresreg,tmpref);
  603. end;
  604. procedure tcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  605. var
  606. so : tshifterop;
  607. begin
  608. if op = OP_NEG then
  609. begin
  610. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,src,0));
  611. maybeadjustresult(list,OP_NEG,size,dst);
  612. end
  613. else if op = OP_NOT then
  614. begin
  615. if size in [OS_8, OS_16, OS_S8, OS_S16] then
  616. begin
  617. shifterop_reset(so);
  618. so.shiftmode:=SM_LSL;
  619. if size in [OS_8, OS_S8] then
  620. so.shiftimm:=24
  621. else
  622. so.shiftimm:=16;
  623. list.concat(taicpu.op_reg_reg_shifterop(A_MVN,dst,src,so));
  624. {Using a shift here allows this to be folded into another instruction}
  625. if size in [OS_S8, OS_S16] then
  626. so.shiftmode:=SM_ASR
  627. else
  628. so.shiftmode:=SM_LSR;
  629. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  630. end
  631. else
  632. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  633. end
  634. else
  635. a_op_reg_reg_reg(list,op,size,src,dst,dst);
  636. end;
  637. const
  638. op_reg_reg_opcg2asmop: array[TOpCG] of tasmop =
  639. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  640. A_NONE,A_NONE,A_NONE,A_SUB,A_EOR,A_NONE,A_NONE);
  641. op_reg_opcg2asmop: array[TOpCG] of tasmop =
  642. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  643. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  644. op_reg_postfix: array[TOpCG] of TOpPostfix =
  645. (PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,
  646. PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None);
  647. procedure tcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  648. size: tcgsize; a: tcgint; src, dst: tregister);
  649. var
  650. ovloc : tlocation;
  651. begin
  652. a_op_const_reg_reg_checkoverflow(list,op,size,a,src,dst,false,ovloc);
  653. end;
  654. procedure tcgarm.a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  655. size: tcgsize; src1, src2, dst: tregister);
  656. var
  657. ovloc : tlocation;
  658. begin
  659. a_op_reg_reg_reg_checkoverflow(list,op,size,src1,src2,dst,false,ovloc);
  660. end;
  661. function opshift2shiftmode(op: TOpCg): tshiftmode;
  662. begin
  663. case op of
  664. OP_SHL: Result:=SM_LSL;
  665. OP_SHR: Result:=SM_LSR;
  666. OP_ROR: Result:=SM_ROR;
  667. OP_ROL: Result:=SM_ROR;
  668. OP_SAR: Result:=SM_ASR;
  669. else internalerror(2012070501);
  670. end
  671. end;
  672. function tbasecgarm.try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  673. var
  674. multiplier : dword;
  675. power : longint;
  676. shifterop : tshifterop;
  677. bitsset : byte;
  678. negative : boolean;
  679. first : boolean;
  680. b,
  681. cycles : byte;
  682. maxeffort : byte;
  683. begin
  684. result:=true;
  685. cycles:=0;
  686. negative:=a<0;
  687. shifterop.rs:=NR_NO;
  688. shifterop.shiftmode:=SM_LSL;
  689. if negative then
  690. inc(cycles);
  691. multiplier:=dword(abs(a));
  692. bitsset:=popcnt(multiplier and $fffffffe);
  693. { heuristics to estimate how much instructions are reasonable to replace the mul,
  694. this is currently based on XScale timings }
  695. { in the simplest case, we need a mov to load the constant and a mul to carry out the
  696. actual multiplication, this requires min. 1+4 cycles
  697. because the first shift imm. might cause a stall and because we need more instructions
  698. when replacing the mul we generate max. 3 instructions to replace this mul }
  699. maxeffort:=3;
  700. { if the constant is not a shifter op, we need either some mov/mvn/bic/or sequence or
  701. a ldr, so generating one more operation to replace this is beneficial }
  702. if not(is_shifter_const(dword(a),b)) and not(is_shifter_const(not(dword(a)),b)) then
  703. inc(maxeffort);
  704. { if the upper 5 bits are all set or clear, mul is one cycle faster }
  705. if ((dword(a) and $f8000000)=0) or ((dword(a) and $f8000000)=$f8000000) then
  706. dec(maxeffort);
  707. { if the upper 17 bits are all set or clear, mul is another cycle faster }
  708. if ((dword(a) and $ffff8000)=0) or ((dword(a) and $ffff8000)=$ffff8000) then
  709. dec(maxeffort);
  710. { most simple cases }
  711. if a=1 then
  712. a_load_reg_reg(list,OS_32,OS_32,src,dst)
  713. else if a=0 then
  714. a_load_const_reg(list,OS_32,0,dst)
  715. else if a=-1 then
  716. a_op_reg_reg(list,OP_NEG,OS_32,src,dst)
  717. { add up ?
  718. basically, one add is needed for each bit being set in the constant factor
  719. however, the least significant bit is for free, it can be hidden in the initial
  720. instruction
  721. }
  722. else if (bitsset+cycles<=maxeffort) and
  723. (bitsset<=popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)) then
  724. begin
  725. first:=true;
  726. while multiplier<>0 do
  727. begin
  728. shifterop.shiftimm:=BsrDWord(multiplier);
  729. if odd(multiplier) then
  730. begin
  731. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,shifterop));
  732. dec(multiplier);
  733. end
  734. else
  735. if first then
  736. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  737. else
  738. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,src,shifterop));
  739. first:=false;
  740. dec(multiplier,1 shl shifterop.shiftimm);
  741. end;
  742. if negative then
  743. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  744. end
  745. { subtract from the next greater power of two? }
  746. else if popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)+cycles+1<=maxeffort then
  747. begin
  748. first:=true;
  749. while multiplier<>0 do
  750. begin
  751. if first then
  752. begin
  753. multiplier:=(1 shl power)-multiplier;
  754. shifterop.shiftimm:=power;
  755. end
  756. else
  757. shifterop.shiftimm:=BsrDWord(multiplier);
  758. if odd(multiplier) then
  759. begin
  760. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,shifterop));
  761. dec(multiplier);
  762. end
  763. else
  764. if first then
  765. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  766. else
  767. begin
  768. list.concat(taicpu.op_reg_reg_reg_shifterop(A_SUB,dst,dst,src,shifterop));
  769. dec(multiplier,1 shl shifterop.shiftimm);
  770. end;
  771. first:=false;
  772. end;
  773. if negative then
  774. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  775. end
  776. else
  777. result:=false;
  778. end;
  779. procedure tcgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  780. var
  781. shift, lsb, width : byte;
  782. tmpreg : tregister;
  783. so : tshifterop;
  784. l1 : longint;
  785. imm1, imm2: DWord;
  786. begin
  787. optimize_op_const(size, op, a);
  788. case op of
  789. OP_NONE:
  790. begin
  791. if src <> dst then
  792. a_load_reg_reg(list, size, size, src, dst);
  793. exit;
  794. end;
  795. OP_MOVE:
  796. begin
  797. a_load_const_reg(list, size, a, dst);
  798. exit;
  799. end;
  800. end;
  801. ovloc.loc:=LOC_VOID;
  802. if {$ifopt R+}(a<>-2147483648) and{$endif} not setflags and is_shifter_const(-a,shift) then
  803. case op of
  804. OP_ADD:
  805. begin
  806. op:=OP_SUB;
  807. a:=aint(dword(-a));
  808. end;
  809. OP_SUB:
  810. begin
  811. op:=OP_ADD;
  812. a:=aint(dword(-a));
  813. end
  814. end;
  815. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  816. case op of
  817. OP_NEG,OP_NOT:
  818. internalerror(200308281);
  819. OP_SHL,
  820. OP_SHR,
  821. OP_ROL,
  822. OP_ROR,
  823. OP_SAR:
  824. begin
  825. if a>32 then
  826. internalerror(200308294);
  827. shifterop_reset(so);
  828. so.shiftmode:=opshift2shiftmode(op);
  829. if op = OP_ROL then
  830. so.shiftimm:=32-a
  831. else
  832. so.shiftimm:=a;
  833. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  834. end;
  835. else
  836. {if (op in [OP_SUB, OP_ADD]) and
  837. ((a < 0) or
  838. (a > 4095)) then
  839. begin
  840. tmpreg:=getintregister(list,size);
  841. list.concat(taicpu.op_reg_const(A_MOVT, tmpreg, (a shr 16) and $FFFF));
  842. list.concat(taicpu.op_reg_const(A_MOV, tmpreg, a and $FFFF));
  843. list.concat(setoppostfix(taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))
  844. ));
  845. end
  846. else}
  847. begin
  848. if cgsetflags or setflags then
  849. a_reg_alloc(list,NR_DEFAULTFLAGS);
  850. list.concat(setoppostfix(
  851. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  852. end;
  853. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  854. begin
  855. ovloc.loc:=LOC_FLAGS;
  856. case op of
  857. OP_ADD:
  858. ovloc.resflags:=F_CS;
  859. OP_SUB:
  860. ovloc.resflags:=F_CC;
  861. end;
  862. end;
  863. end
  864. else
  865. begin
  866. { there could be added some more sophisticated optimizations }
  867. if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  868. a_op_reg_reg(list,OP_NEG,size,src,dst)
  869. { we do this here instead in the peephole optimizer because
  870. it saves us a register }
  871. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  872. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  873. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  874. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  875. begin
  876. if l1>32 then{roozbeh does this ever happen?}
  877. internalerror(200308296);
  878. shifterop_reset(so);
  879. so.shiftmode:=SM_LSL;
  880. so.shiftimm:=l1;
  881. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  882. end
  883. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  884. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  885. begin
  886. if l1>32 then{does this ever happen?}
  887. internalerror(201205181);
  888. shifterop_reset(so);
  889. so.shiftmode:=SM_LSL;
  890. so.shiftimm:=l1;
  891. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  892. end
  893. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  894. begin
  895. { nothing to do on success }
  896. end
  897. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  898. broader range of shifterconstants.}
  899. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  900. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  901. { Doing two shifts instead of two bics might allow the peephole optimizer to fold the second shift
  902. into the following instruction}
  903. else if (op = OP_AND) and
  904. is_continuous_mask(a, lsb, width) and
  905. ((lsb = 0) or ((lsb + width) = 32)) then
  906. begin
  907. shifterop_reset(so);
  908. if (width = 16) and
  909. (lsb = 0) and
  910. (current_settings.cputype >= cpu_armv6) then
  911. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  912. else if (width = 8) and
  913. (lsb = 0) and
  914. (current_settings.cputype >= cpu_armv6) then
  915. list.concat(taicpu.op_reg_reg(A_UXTB,dst,src))
  916. else if lsb = 0 then
  917. begin
  918. so.shiftmode:=SM_LSL;
  919. so.shiftimm:=32-width;
  920. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  921. so.shiftmode:=SM_LSR;
  922. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  923. end
  924. else
  925. begin
  926. so.shiftmode:=SM_LSR;
  927. so.shiftimm:=lsb;
  928. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  929. so.shiftmode:=SM_LSL;
  930. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  931. end;
  932. end
  933. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  934. begin
  935. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,imm1));
  936. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  937. end
  938. else if (op in [OP_ADD, OP_SUB, OP_OR, OP_XOR]) and
  939. not(cgsetflags or setflags) and
  940. split_into_shifter_const(a, imm1, imm2) then
  941. begin
  942. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,imm1));
  943. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  944. end
  945. else
  946. begin
  947. tmpreg:=getintregister(list,size);
  948. a_load_const_reg(list,size,a,tmpreg);
  949. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  950. end;
  951. end;
  952. maybeadjustresult(list,op,size,dst);
  953. end;
  954. procedure tcgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  955. var
  956. so : tshifterop;
  957. tmpreg,overflowreg : tregister;
  958. asmop : tasmop;
  959. begin
  960. ovloc.loc:=LOC_VOID;
  961. case op of
  962. OP_NEG,OP_NOT,
  963. OP_DIV,OP_IDIV:
  964. internalerror(200308283);
  965. OP_SHL,
  966. OP_SHR,
  967. OP_SAR,
  968. OP_ROR:
  969. begin
  970. if (op = OP_ROR) and not(size in [OS_32,OS_S32]) then
  971. internalerror(2008072801);
  972. shifterop_reset(so);
  973. so.rs:=src1;
  974. so.shiftmode:=opshift2shiftmode(op);
  975. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  976. end;
  977. OP_ROL:
  978. begin
  979. if not(size in [OS_32,OS_S32]) then
  980. internalerror(2008072801);
  981. { simulate ROL by ror'ing 32-value }
  982. tmpreg:=getintregister(list,OS_32);
  983. list.concat(taicpu.op_reg_reg_const(A_RSB,tmpreg,src1, 32));
  984. shifterop_reset(so);
  985. so.rs:=tmpreg;
  986. so.shiftmode:=SM_ROR;
  987. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  988. end;
  989. OP_IMUL,
  990. OP_MUL:
  991. begin
  992. if cgsetflags or setflags then
  993. begin
  994. overflowreg:=getintregister(list,size);
  995. if op=OP_IMUL then
  996. asmop:=A_SMULL
  997. else
  998. asmop:=A_UMULL;
  999. { the arm doesn't allow that rd and rm are the same }
  1000. if dst=src2 then
  1001. begin
  1002. if dst<>src1 then
  1003. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  1004. else
  1005. begin
  1006. tmpreg:=getintregister(list,size);
  1007. a_load_reg_reg(list,size,size,src2,dst);
  1008. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  1009. end;
  1010. end
  1011. else
  1012. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  1013. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1014. if op=OP_IMUL then
  1015. begin
  1016. shifterop_reset(so);
  1017. so.shiftmode:=SM_ASR;
  1018. so.shiftimm:=31;
  1019. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  1020. end
  1021. else
  1022. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  1023. ovloc.loc:=LOC_FLAGS;
  1024. ovloc.resflags:=F_NE;
  1025. end
  1026. else
  1027. begin
  1028. { the arm doesn't allow that rd and rm are the same }
  1029. if dst=src2 then
  1030. begin
  1031. if dst<>src1 then
  1032. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  1033. else
  1034. begin
  1035. tmpreg:=getintregister(list,size);
  1036. a_load_reg_reg(list,size,size,src2,dst);
  1037. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  1038. end;
  1039. end
  1040. else
  1041. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  1042. end;
  1043. end;
  1044. else
  1045. begin
  1046. if cgsetflags or setflags then
  1047. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1048. list.concat(setoppostfix(
  1049. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  1050. end;
  1051. end;
  1052. maybeadjustresult(list,op,size,dst);
  1053. end;
  1054. procedure tcgarm.a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister);
  1055. var
  1056. asmop: tasmop;
  1057. begin
  1058. list.concat(tai_comment.create(strpnew('tcgarm.a_mul_reg_reg_pair called')));
  1059. case size of
  1060. OS_32: asmop:=A_UMULL;
  1061. OS_S32: asmop:=A_SMULL;
  1062. else
  1063. InternalError(2014060802);
  1064. end;
  1065. { The caller might omit dstlo or dsthi, when he is not interested in it, we still
  1066. need valid registers everywhere. In case of dsthi = NR_NO we could fall back to
  1067. 32x32=32 bit multiplication}
  1068. if (dstlo = NR_NO) then
  1069. dstlo:=getintregister(list,size);
  1070. if (dsthi = NR_NO) then
  1071. dsthi:=getintregister(list,size);
  1072. list.concat(taicpu.op_reg_reg_reg_reg(asmop, dstlo, dsthi, src1,src2));
  1073. end;
  1074. function tbasecgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  1075. var
  1076. tmpreg1,tmpreg2 : tregister;
  1077. tmpref : treference;
  1078. l : tasmlabel;
  1079. begin
  1080. tmpreg1:=NR_NO;
  1081. { Be sure to have a base register }
  1082. if (ref.base=NR_NO) then
  1083. begin
  1084. if ref.shiftmode<>SM_None then
  1085. internalerror(2014020701);
  1086. ref.base:=ref.index;
  1087. ref.index:=NR_NO;
  1088. end;
  1089. { absolute symbols can't be handled directly, we've to store the symbol reference
  1090. in the text segment and access it pc relative
  1091. For now, we assume that references where base or index equals to PC are already
  1092. relative, all other references are assumed to be absolute and thus they need
  1093. to be handled extra.
  1094. A proper solution would be to change refoptions to a set and store the information
  1095. if the symbol is absolute or relative there.
  1096. }
  1097. if (assigned(ref.symbol) and
  1098. not(is_pc(ref.base)) and
  1099. not(is_pc(ref.index))
  1100. ) or
  1101. { [#xxx] isn't a valid address operand }
  1102. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  1103. (ref.offset<-4095) or
  1104. (ref.offset>4095) or
  1105. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  1106. ((ref.offset<-255) or
  1107. (ref.offset>255)
  1108. )
  1109. ) or
  1110. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1111. ((ref.offset<-1020) or
  1112. (ref.offset>1020) or
  1113. ((abs(ref.offset) mod 4)<>0)
  1114. )
  1115. ) or
  1116. ((GenerateThumbCode) and
  1117. (((oppostfix in [PF_SB,PF_SH]) and (ref.offset<>0)) or
  1118. ((oppostfix=PF_None) and ((ref.offset<0) or ((ref.base<>NR_STACK_POINTER_REG) and (ref.offset>124)) or
  1119. ((ref.base=NR_STACK_POINTER_REG) and (ref.offset>1020)) or ((ref.offset mod 4)<>0))) or
  1120. ((oppostfix=PF_H) and ((ref.offset<0) or (ref.offset>62) or ((ref.offset mod 2)<>0) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0)))) or
  1121. ((oppostfix=PF_B) and ((ref.offset<0) or (ref.offset>31) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0))))
  1122. )
  1123. ) then
  1124. begin
  1125. fixref(list,ref);
  1126. end;
  1127. if GenerateThumbCode then
  1128. begin
  1129. { certain thumb load require base and index }
  1130. if (oppostfix in [PF_SB,PF_SH]) and
  1131. (ref.base<>NR_NO) and (ref.index=NR_NO) then
  1132. begin
  1133. tmpreg1:=getintregister(list,OS_ADDR);
  1134. a_load_const_reg(list,OS_ADDR,0,tmpreg1);
  1135. ref.index:=tmpreg1;
  1136. end;
  1137. { "hi" registers cannot be used as base or index }
  1138. if (getsupreg(ref.base) in [RS_R8..RS_R12,RS_R14]) or
  1139. ((ref.base=NR_R13) and (ref.index<>NR_NO)) then
  1140. begin
  1141. tmpreg1:=getintregister(list,OS_ADDR);
  1142. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.base,tmpreg1);
  1143. ref.base:=tmpreg1;
  1144. end;
  1145. if getsupreg(ref.index) in [RS_R8..RS_R14] then
  1146. begin
  1147. tmpreg1:=getintregister(list,OS_ADDR);
  1148. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.index,tmpreg1);
  1149. ref.index:=tmpreg1;
  1150. end;
  1151. end;
  1152. { fold if there is base, index and offset, however, don't fold
  1153. for vfp memory instructions because we later fold the index }
  1154. if not((op in [A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1155. (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  1156. begin
  1157. if tmpreg1<>NR_NO then
  1158. begin
  1159. tmpreg2:=getintregister(list,OS_ADDR);
  1160. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg1,tmpreg2);
  1161. tmpreg1:=tmpreg2;
  1162. end
  1163. else
  1164. begin
  1165. tmpreg1:=getintregister(list,OS_ADDR);
  1166. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg1);
  1167. ref.base:=tmpreg1;
  1168. end;
  1169. ref.offset:=0;
  1170. end;
  1171. { floating point operations have only limited references
  1172. we expect here, that a base is already set }
  1173. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  1174. begin
  1175. if ref.shiftmode<>SM_none then
  1176. internalerror(200309121);
  1177. if tmpreg1<>NR_NO then
  1178. begin
  1179. if ref.base=tmpreg1 then
  1180. begin
  1181. if ref.signindex<0 then
  1182. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,tmpreg1,ref.index))
  1183. else
  1184. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,tmpreg1,ref.index));
  1185. ref.index:=NR_NO;
  1186. end
  1187. else
  1188. begin
  1189. if ref.index<>tmpreg1 then
  1190. internalerror(200403161);
  1191. if ref.signindex<0 then
  1192. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,ref.base,tmpreg1))
  1193. else
  1194. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,tmpreg1));
  1195. ref.base:=tmpreg1;
  1196. ref.index:=NR_NO;
  1197. end;
  1198. end
  1199. else
  1200. begin
  1201. tmpreg1:=getintregister(list,OS_ADDR);
  1202. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,ref.index));
  1203. ref.base:=tmpreg1;
  1204. ref.index:=NR_NO;
  1205. end;
  1206. end;
  1207. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  1208. Result := ref;
  1209. end;
  1210. procedure tbasecgarm.a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);
  1211. var
  1212. oppostfix:toppostfix;
  1213. usedtmpref: treference;
  1214. tmpreg : tregister;
  1215. dir : integer;
  1216. begin
  1217. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  1218. FromSize := ToSize;
  1219. case ToSize of
  1220. { signed integer registers }
  1221. OS_8,
  1222. OS_S8:
  1223. oppostfix:=PF_B;
  1224. OS_16,
  1225. OS_S16:
  1226. oppostfix:=PF_H;
  1227. OS_32,
  1228. OS_S32,
  1229. { for vfp value stored in integer register }
  1230. OS_F32:
  1231. oppostfix:=PF_None;
  1232. else
  1233. InternalError(200308299);
  1234. end;
  1235. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[tosize]) then
  1236. begin
  1237. if target_info.endian=endian_big then
  1238. dir:=-1
  1239. else
  1240. dir:=1;
  1241. case FromSize of
  1242. OS_16,OS_S16:
  1243. begin
  1244. tmpreg:=getintregister(list,OS_INT);
  1245. usedtmpref:=ref;
  1246. if target_info.endian=endian_big then
  1247. inc(usedtmpref.offset,1);
  1248. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1249. inc(usedtmpref.offset,dir);
  1250. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1251. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1252. end;
  1253. OS_32,OS_S32:
  1254. begin
  1255. tmpreg:=getintregister(list,OS_INT);
  1256. usedtmpref:=ref;
  1257. if ref.alignment=2 then
  1258. begin
  1259. if target_info.endian=endian_big then
  1260. inc(usedtmpref.offset,2);
  1261. usedtmpref:=a_internal_load_reg_ref(list,OS_16,OS_16,reg,usedtmpref);
  1262. a_op_const_reg_reg(list,OP_SHR,OS_INT,16,reg,tmpreg);
  1263. inc(usedtmpref.offset,dir*2);
  1264. a_internal_load_reg_ref(list,OS_16,OS_16,tmpreg,usedtmpref);
  1265. end
  1266. else
  1267. begin
  1268. if target_info.endian=endian_big then
  1269. inc(usedtmpref.offset,3);
  1270. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1271. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1272. inc(usedtmpref.offset,dir);
  1273. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1274. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1275. inc(usedtmpref.offset,dir);
  1276. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1277. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1278. inc(usedtmpref.offset,dir);
  1279. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1280. end;
  1281. end
  1282. else
  1283. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1284. end;
  1285. end
  1286. else
  1287. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1288. end;
  1289. function tbasecgarm.a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  1290. var
  1291. oppostfix:toppostfix;
  1292. begin
  1293. case ToSize of
  1294. { signed integer registers }
  1295. OS_8,
  1296. OS_S8:
  1297. oppostfix:=PF_B;
  1298. OS_16,
  1299. OS_S16:
  1300. oppostfix:=PF_H;
  1301. OS_32,
  1302. OS_S32:
  1303. oppostfix:=PF_None;
  1304. else
  1305. InternalError(2003082910);
  1306. end;
  1307. result:=handle_load_store(list,A_STR,oppostfix,reg,ref);
  1308. end;
  1309. function tbasecgarm.a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  1310. var
  1311. oppostfix:toppostfix;
  1312. begin
  1313. case FromSize of
  1314. { signed integer registers }
  1315. OS_8:
  1316. oppostfix:=PF_B;
  1317. OS_S8:
  1318. oppostfix:=PF_SB;
  1319. OS_16:
  1320. oppostfix:=PF_H;
  1321. OS_S16:
  1322. oppostfix:=PF_SH;
  1323. OS_32,
  1324. OS_S32:
  1325. oppostfix:=PF_None;
  1326. else
  1327. InternalError(200308291);
  1328. end;
  1329. result:=handle_load_store(list,A_LDR,oppostfix,reg,ref);
  1330. end;
  1331. procedure tbasecgarm.a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);
  1332. var
  1333. so : tshifterop;
  1334. procedure do_shift(shiftmode : tshiftmode; shiftimm : byte; reg : tregister);
  1335. begin
  1336. if GenerateThumbCode then
  1337. begin
  1338. case shiftmode of
  1339. SM_ASR:
  1340. a_op_const_reg_reg(list,OP_SAR,OS_32,shiftimm,reg,reg2);
  1341. SM_LSR:
  1342. a_op_const_reg_reg(list,OP_SHR,OS_32,shiftimm,reg,reg2);
  1343. SM_LSL:
  1344. a_op_const_reg_reg(list,OP_SHL,OS_32,shiftimm,reg,reg2);
  1345. else
  1346. internalerror(2013090301);
  1347. end;
  1348. end
  1349. else
  1350. begin
  1351. so.shiftmode:=shiftmode;
  1352. so.shiftimm:=shiftimm;
  1353. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,reg2,reg,so));
  1354. end;
  1355. end;
  1356. var
  1357. instr: taicpu;
  1358. conv_done: boolean;
  1359. begin
  1360. if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then
  1361. internalerror(2002090901);
  1362. conv_done:=false;
  1363. if tosize<>fromsize then
  1364. begin
  1365. shifterop_reset(so);
  1366. conv_done:=true;
  1367. if tcgsize2size[tosize]<=tcgsize2size[fromsize] then
  1368. fromsize:=tosize;
  1369. if current_settings.cputype<cpu_armv6 then
  1370. case fromsize of
  1371. OS_8:
  1372. if GenerateThumbCode then
  1373. a_op_const_reg_reg(list,OP_AND,OS_32,$ff,reg1,reg2)
  1374. else
  1375. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1376. OS_S8:
  1377. begin
  1378. do_shift(SM_LSL,24,reg1);
  1379. if tosize=OS_16 then
  1380. begin
  1381. do_shift(SM_ASR,8,reg2);
  1382. do_shift(SM_LSR,16,reg2);
  1383. end
  1384. else
  1385. do_shift(SM_ASR,24,reg2);
  1386. end;
  1387. OS_16:
  1388. begin
  1389. do_shift(SM_LSL,16,reg1);
  1390. do_shift(SM_LSR,16,reg2);
  1391. end;
  1392. OS_S16:
  1393. begin
  1394. do_shift(SM_LSL,16,reg1);
  1395. do_shift(SM_ASR,16,reg2)
  1396. end;
  1397. else
  1398. conv_done:=false;
  1399. end
  1400. else
  1401. case fromsize of
  1402. OS_8:
  1403. if GenerateThumbCode then
  1404. list.concat(taicpu.op_reg_reg(A_UXTB,reg2,reg1))
  1405. else
  1406. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1407. OS_S8:
  1408. begin
  1409. if tosize=OS_16 then
  1410. begin
  1411. so.shiftmode:=SM_ROR;
  1412. so.shiftimm:=16;
  1413. list.concat(taicpu.op_reg_reg_shifterop(A_SXTB16,reg2,reg1,so));
  1414. do_shift(SM_LSR,16,reg2);
  1415. end
  1416. else
  1417. list.concat(taicpu.op_reg_reg(A_SXTB,reg2,reg1));
  1418. end;
  1419. OS_16:
  1420. list.concat(taicpu.op_reg_reg(A_UXTH,reg2,reg1));
  1421. OS_S16:
  1422. list.concat(taicpu.op_reg_reg(A_SXTH,reg2,reg1));
  1423. else
  1424. conv_done:=false;
  1425. end
  1426. end;
  1427. if not conv_done and (reg1<>reg2) then
  1428. begin
  1429. { same size, only a register mov required }
  1430. instr:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
  1431. list.Concat(instr);
  1432. { Notify the register allocator that we have written a move instruction so
  1433. it can try to eliminate it. }
  1434. add_move_instruction(instr);
  1435. end;
  1436. end;
  1437. procedure tbasecgarm.a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);
  1438. var
  1439. href,href2 : treference;
  1440. hloc : pcgparalocation;
  1441. begin
  1442. href:=ref;
  1443. hloc:=paraloc.location;
  1444. while assigned(hloc) do
  1445. begin
  1446. case hloc^.loc of
  1447. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  1448. begin
  1449. paramanager.allocparaloc(list,paraloc.location);
  1450. a_loadfpu_ref_reg(list,size,size,ref,hloc^.register);
  1451. end;
  1452. LOC_REGISTER :
  1453. case hloc^.size of
  1454. OS_32,
  1455. OS_F32:
  1456. begin
  1457. paramanager.allocparaloc(list,paraloc.location);
  1458. a_load_ref_reg(list,OS_32,OS_32,href,hloc^.register);
  1459. end;
  1460. OS_64,
  1461. OS_F64:
  1462. cg64.a_load64_ref_cgpara(list,href,paraloc);
  1463. else
  1464. a_load_ref_reg(list,hloc^.size,hloc^.size,href,hloc^.register);
  1465. end;
  1466. LOC_REFERENCE :
  1467. begin
  1468. reference_reset_base(href2,hloc^.reference.index,hloc^.reference.offset,paraloc.alignment);
  1469. { concatcopy should choose the best way to copy the data }
  1470. g_concatcopy(list,href,href2,tcgsize2size[hloc^.size]);
  1471. end;
  1472. else
  1473. internalerror(200408241);
  1474. end;
  1475. inc(href.offset,tcgsize2size[hloc^.size]);
  1476. hloc:=hloc^.next;
  1477. end;
  1478. end;
  1479. procedure tbasecgarm.a_loadfpu_reg_reg(list: TAsmList; fromsize,tosize: tcgsize; reg1, reg2: tregister);
  1480. begin
  1481. list.concat(setoppostfix(taicpu.op_reg_reg(A_MVF,reg2,reg1),cgsize2fpuoppostfix[tosize]));
  1482. end;
  1483. procedure tbasecgarm.a_loadfpu_ref_reg(list: TAsmList; fromsize,tosize: tcgsize; const ref: treference; reg: tregister);
  1484. var
  1485. oppostfix:toppostfix;
  1486. begin
  1487. case fromsize of
  1488. OS_32,
  1489. OS_F32:
  1490. oppostfix:=PF_S;
  1491. OS_64,
  1492. OS_F64:
  1493. oppostfix:=PF_D;
  1494. OS_F80:
  1495. oppostfix:=PF_E;
  1496. else
  1497. InternalError(200309021);
  1498. end;
  1499. handle_load_store(list,A_LDF,oppostfix,reg,ref);
  1500. if fromsize<>tosize then
  1501. a_loadfpu_reg_reg(list,fromsize,tosize,reg,reg);
  1502. end;
  1503. procedure tbasecgarm.a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);
  1504. var
  1505. oppostfix:toppostfix;
  1506. begin
  1507. case tosize of
  1508. OS_F32:
  1509. oppostfix:=PF_S;
  1510. OS_F64:
  1511. oppostfix:=PF_D;
  1512. OS_F80:
  1513. oppostfix:=PF_E;
  1514. else
  1515. InternalError(200309022);
  1516. end;
  1517. handle_load_store(list,A_STF,oppostfix,reg,ref);
  1518. end;
  1519. { comparison operations }
  1520. procedure tbasecgarm.a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  1521. l : tasmlabel);
  1522. var
  1523. tmpreg : tregister;
  1524. b : byte;
  1525. begin
  1526. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1527. if (not(GenerateThumbCode) and is_shifter_const(a,b)) or
  1528. ((GenerateThumbCode) and is_thumb_imm(a)) then
  1529. list.concat(taicpu.op_reg_const(A_CMP,reg,a))
  1530. { CMN reg,0 and CMN reg,$80000000 are different from CMP reg,$ffffffff
  1531. and CMP reg,$7fffffff regarding the flags according to the ARM manual }
  1532. else if (a<>$7fffffff) and (a<>-1) and not(GenerateThumbCode) and is_shifter_const(-a,b) then
  1533. list.concat(taicpu.op_reg_const(A_CMN,reg,-a))
  1534. else
  1535. begin
  1536. tmpreg:=getintregister(list,size);
  1537. a_load_const_reg(list,size,a,tmpreg);
  1538. list.concat(taicpu.op_reg_reg(A_CMP,reg,tmpreg));
  1539. end;
  1540. a_jmp_cond(list,cmp_op,l);
  1541. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1542. end;
  1543. procedure tbasecgarm.a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister);
  1544. begin
  1545. if reverse then
  1546. begin
  1547. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,src));
  1548. list.Concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,31));
  1549. list.Concat(taicpu.op_reg_reg_const(A_AND,dst,dst,255));
  1550. end
  1551. { it is decided during the compilation of the system unit if this code is used or not
  1552. so no additional check for rbit is needed }
  1553. else
  1554. begin
  1555. list.Concat(taicpu.op_reg_reg(A_RBIT,dst,src));
  1556. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,dst));
  1557. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1558. list.Concat(taicpu.op_reg_const(A_CMP,dst,32));
  1559. if GenerateThumb2Code then
  1560. list.Concat(taicpu.op_cond(A_IT, C_EQ));
  1561. list.Concat(setcondition(taicpu.op_reg_const(A_MOV,dst,$ff),C_EQ));
  1562. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1563. end;
  1564. end;
  1565. procedure tbasecgarm.a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel);
  1566. begin
  1567. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1568. list.concat(taicpu.op_reg_reg(A_CMP,reg2,reg1));
  1569. a_jmp_cond(list,cmp_op,l);
  1570. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1571. end;
  1572. procedure tbasecgarm.a_jmp_name(list : TAsmList;const s : string);
  1573. var
  1574. ai : taicpu;
  1575. begin
  1576. { generate far jump, leave it to the optimizer to get rid of it }
  1577. if GenerateThumbCode then
  1578. ai:=taicpu.op_sym(A_BL,current_asmdata.RefAsmSymbol(s))
  1579. else
  1580. ai:=taicpu.op_sym(A_B,current_asmdata.RefAsmSymbol(s));
  1581. ai.is_jmp:=true;
  1582. list.concat(ai);
  1583. end;
  1584. procedure tbasecgarm.a_jmp_always(list : TAsmList;l: tasmlabel);
  1585. var
  1586. ai : taicpu;
  1587. begin
  1588. { generate far jump, leave it to the optimizer to get rid of it }
  1589. if GenerateThumbCode then
  1590. ai:=taicpu.op_sym(A_BL,l)
  1591. else
  1592. ai:=taicpu.op_sym(A_B,l);
  1593. ai.is_jmp:=true;
  1594. list.concat(ai);
  1595. end;
  1596. procedure tbasecgarm.a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel);
  1597. var
  1598. ai : taicpu;
  1599. inv_flags : TResFlags;
  1600. hlabel : TAsmLabel;
  1601. begin
  1602. if GenerateThumbCode then
  1603. begin
  1604. inv_flags:=f;
  1605. inverse_flags(inv_flags);
  1606. { the optimizer has to fix this if jump range is sufficient short }
  1607. current_asmdata.getjumplabel(hlabel);
  1608. ai:=setcondition(taicpu.op_sym(A_B,hlabel),flags_to_cond(inv_flags));
  1609. ai.is_jmp:=true;
  1610. list.concat(ai);
  1611. a_jmp_always(list,l);
  1612. a_label(list,hlabel);
  1613. end
  1614. else
  1615. begin
  1616. ai:=setcondition(taicpu.op_sym(A_B,l),flags_to_cond(f));
  1617. ai.is_jmp:=true;
  1618. list.concat(ai);
  1619. end;
  1620. end;
  1621. procedure tbasecgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  1622. begin
  1623. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  1624. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  1625. end;
  1626. procedure tbasecgarm.g_profilecode(list : TAsmList);
  1627. begin
  1628. if target_info.system = system_arm_linux then
  1629. begin
  1630. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R14]));
  1631. a_call_name(list,'__gnu_mcount_nc',false);
  1632. end
  1633. else
  1634. internalerror(2014091201);
  1635. end;
  1636. procedure tbasecgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  1637. var
  1638. ref : treference;
  1639. shift : byte;
  1640. firstfloatreg,lastfloatreg,
  1641. r : byte;
  1642. mmregs,
  1643. regs, saveregs : tcpuregisterset;
  1644. registerarea,
  1645. r7offset,
  1646. stackmisalignment : pint;
  1647. postfix: toppostfix;
  1648. imm1, imm2: DWord;
  1649. stack_parameters : Boolean;
  1650. begin
  1651. LocalSize:=align(LocalSize,4);
  1652. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  1653. { call instruction does not put anything on the stack }
  1654. registerarea:=0;
  1655. tarmprocinfo(current_procinfo).stackpaddingreg:=High(TSuperRegister);
  1656. lastfloatreg:=RS_NO;
  1657. if not(nostackframe) then
  1658. begin
  1659. firstfloatreg:=RS_NO;
  1660. mmregs:=[];
  1661. case current_settings.fputype of
  1662. fpu_fpa,
  1663. fpu_fpa10,
  1664. fpu_fpa11:
  1665. begin
  1666. { save floating point registers? }
  1667. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1668. for r:=RS_F0 to RS_F7 do
  1669. if r in regs then
  1670. begin
  1671. if firstfloatreg=RS_NO then
  1672. firstfloatreg:=r;
  1673. lastfloatreg:=r;
  1674. inc(registerarea,12);
  1675. end;
  1676. end;
  1677. fpu_vfpv2,
  1678. fpu_vfpv3,
  1679. fpu_vfpv3_d16:
  1680. begin;
  1681. mmregs:=rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall);
  1682. end;
  1683. end;
  1684. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1685. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1686. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  1687. { save int registers }
  1688. reference_reset(ref,4);
  1689. ref.index:=NR_STACK_POINTER_REG;
  1690. ref.addressmode:=AM_PREINDEXED;
  1691. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  1692. if not(target_info.system in systems_darwin) then
  1693. begin
  1694. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1695. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1696. begin
  1697. a_reg_alloc(list,NR_R12);
  1698. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  1699. end;
  1700. { the (old) ARM APCS requires saving both the stack pointer (to
  1701. crawl the stack) and the PC (to identify the function this
  1702. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  1703. and R15 -- still needs updating for EABI and Darwin, they don't
  1704. need that }
  1705. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1706. regs:=regs+[RS_FRAME_POINTER_REG,RS_R12,RS_R14,RS_R15]
  1707. else
  1708. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1709. include(regs,RS_R14);
  1710. if regs<>[] then
  1711. begin
  1712. for r:=RS_R0 to RS_R15 do
  1713. if r in regs then
  1714. inc(registerarea,4);
  1715. { if the stack is not 8 byte aligned, try to add an extra register,
  1716. so we can avoid the extra sub/add ...,#4 later (KB) }
  1717. if ((registerarea mod current_settings.alignment.localalignmax) <> 0) then
  1718. for r:=RS_R3 downto RS_R0 do
  1719. if not(r in regs) then
  1720. begin
  1721. regs:=regs+[r];
  1722. inc(registerarea,4);
  1723. tarmprocinfo(current_procinfo).stackpaddingreg:=r;
  1724. break;
  1725. end;
  1726. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  1727. end;
  1728. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1729. begin
  1730. { the framepointer now points to the saved R15, so the saved
  1731. framepointer is at R11-12 (for get_caller_frame) }
  1732. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  1733. a_reg_dealloc(list,NR_R12);
  1734. end;
  1735. end
  1736. else
  1737. begin
  1738. { always save r14 if we use r7 as the framepointer, because
  1739. the parameter offsets are hardcoded in advance and always
  1740. assume that r14 sits on the stack right behind the saved r7
  1741. }
  1742. if current_procinfo.framepointer=NR_FRAME_POINTER_REG then
  1743. include(regs,RS_FRAME_POINTER_REG);
  1744. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1745. include(regs,RS_R14);
  1746. if regs<>[] then
  1747. begin
  1748. { on Darwin, you first have to save [r4-r7,lr], and then
  1749. [r8,r10,r11] and make r7 point to the previously saved
  1750. r7 so that you can perform a stack crawl based on it
  1751. ([r7] is previous stack frame, [r7+4] is return address
  1752. }
  1753. include(regs,RS_FRAME_POINTER_REG);
  1754. saveregs:=regs-[RS_R8,RS_R10,RS_R11];
  1755. r7offset:=0;
  1756. for r:=RS_R0 to RS_R15 do
  1757. if r in saveregs then
  1758. begin
  1759. inc(registerarea,4);
  1760. if r<RS_FRAME_POINTER_REG then
  1761. inc(r7offset,4);
  1762. end;
  1763. { save the registers }
  1764. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1765. { make r7 point to the saved r7 (regardless of whether this
  1766. frame uses the framepointer, for backtrace purposes) }
  1767. if r7offset<>0 then
  1768. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_FRAME_POINTER_REG,NR_R13,r7offset))
  1769. else
  1770. list.concat(taicpu.op_reg_reg(A_MOV,NR_R7,NR_R13));
  1771. { now save the rest (if any) }
  1772. saveregs:=regs-saveregs;
  1773. if saveregs<>[] then
  1774. begin
  1775. for r:=RS_R8 to RS_R11 do
  1776. if r in saveregs then
  1777. inc(registerarea,4);
  1778. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1779. end;
  1780. end;
  1781. end;
  1782. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  1783. if (LocalSize<>0) or
  1784. ((stackmisalignment<>0) and
  1785. ((pi_do_call in current_procinfo.flags) or
  1786. (po_assembler in current_procinfo.procdef.procoptions))) then
  1787. begin
  1788. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  1789. if stack_parameters and (pi_estimatestacksize in current_procinfo.flags) then
  1790. begin
  1791. if localsize>tarmprocinfo(current_procinfo).stackframesize then
  1792. internalerror(2014030901)
  1793. else
  1794. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea;
  1795. end;
  1796. if is_shifter_const(localsize,shift) then
  1797. begin
  1798. a_reg_dealloc(list,NR_R12);
  1799. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  1800. end
  1801. else if split_into_shifter_const(localsize, imm1, imm2) then
  1802. begin
  1803. a_reg_dealloc(list,NR_R12);
  1804. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  1805. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  1806. end
  1807. else
  1808. begin
  1809. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  1810. a_reg_alloc(list,NR_R12);
  1811. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  1812. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  1813. a_reg_dealloc(list,NR_R12);
  1814. end;
  1815. end;
  1816. if (mmregs<>[]) or
  1817. (firstfloatreg<>RS_NO) then
  1818. begin
  1819. reference_reset(ref,4);
  1820. if (tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023) or
  1821. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv3_d16]) then
  1822. begin
  1823. if not is_shifter_const(tarmprocinfo(current_procinfo).floatregstart,shift) then
  1824. begin
  1825. a_reg_alloc(list,NR_R12);
  1826. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  1827. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1828. a_reg_dealloc(list,NR_R12);
  1829. end
  1830. else
  1831. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tarmprocinfo(current_procinfo).floatregstart));
  1832. ref.base:=NR_R12;
  1833. end
  1834. else
  1835. begin
  1836. ref.base:=current_procinfo.framepointer;
  1837. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  1838. end;
  1839. case current_settings.fputype of
  1840. fpu_fpa,
  1841. fpu_fpa10,
  1842. fpu_fpa11:
  1843. begin
  1844. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  1845. lastfloatreg-firstfloatreg+1,ref));
  1846. end;
  1847. fpu_vfpv2,
  1848. fpu_vfpv3,
  1849. fpu_vfpv3_d16:
  1850. begin
  1851. ref.index:=ref.base;
  1852. ref.base:=NR_NO;
  1853. { FSTMX is deprecated on ARMv6 and later }
  1854. {if (current_settings.cputype<cpu_armv6) then
  1855. postfix:=PF_IAX
  1856. else
  1857. postfix:=PF_IAD;}
  1858. list.concat(taicpu.op_ref_regset(A_VSTM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  1859. end;
  1860. end;
  1861. end;
  1862. end;
  1863. end;
  1864. procedure tbasecgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  1865. var
  1866. ref : treference;
  1867. LocalSize : longint;
  1868. firstfloatreg,lastfloatreg,
  1869. r,
  1870. shift : byte;
  1871. mmregs,
  1872. saveregs,
  1873. regs : tcpuregisterset;
  1874. registerarea,
  1875. stackmisalignment: pint;
  1876. paddingreg: TSuperRegister;
  1877. mmpostfix: toppostfix;
  1878. imm1, imm2: DWord;
  1879. begin
  1880. if not(nostackframe) then
  1881. begin
  1882. registerarea:=0;
  1883. firstfloatreg:=RS_NO;
  1884. lastfloatreg:=RS_NO;
  1885. mmregs:=[];
  1886. saveregs:=[];
  1887. case current_settings.fputype of
  1888. fpu_fpa,
  1889. fpu_fpa10,
  1890. fpu_fpa11:
  1891. begin
  1892. { restore floating point registers? }
  1893. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1894. for r:=RS_F0 to RS_F7 do
  1895. if r in regs then
  1896. begin
  1897. if firstfloatreg=RS_NO then
  1898. firstfloatreg:=r;
  1899. lastfloatreg:=r;
  1900. { floating point register space is already included in
  1901. localsize below by calc_stackframe_size
  1902. inc(registerarea,12);
  1903. }
  1904. end;
  1905. end;
  1906. fpu_vfpv2,
  1907. fpu_vfpv3,
  1908. fpu_vfpv3_d16:
  1909. begin;
  1910. { restore vfp registers? }
  1911. mmregs:=rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall);
  1912. end;
  1913. end;
  1914. if (firstfloatreg<>RS_NO) or
  1915. (mmregs<>[]) then
  1916. begin
  1917. reference_reset(ref,4);
  1918. if (tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023) or
  1919. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv3_d16]) then
  1920. begin
  1921. if not is_shifter_const(tarmprocinfo(current_procinfo).floatregstart,shift) then
  1922. begin
  1923. a_reg_alloc(list,NR_R12);
  1924. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  1925. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1926. a_reg_dealloc(list,NR_R12);
  1927. end
  1928. else
  1929. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tarmprocinfo(current_procinfo).floatregstart));
  1930. ref.base:=NR_R12;
  1931. end
  1932. else
  1933. begin
  1934. ref.base:=current_procinfo.framepointer;
  1935. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  1936. end;
  1937. case current_settings.fputype of
  1938. fpu_fpa,
  1939. fpu_fpa10,
  1940. fpu_fpa11:
  1941. begin
  1942. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  1943. lastfloatreg-firstfloatreg+1,ref));
  1944. end;
  1945. fpu_vfpv2,
  1946. fpu_vfpv3,
  1947. fpu_vfpv3_d16:
  1948. begin
  1949. ref.index:=ref.base;
  1950. ref.base:=NR_NO;
  1951. { FLDMX is deprecated on ARMv6 and later }
  1952. {if (current_settings.cputype<cpu_armv6) then
  1953. mmpostfix:=PF_IAX
  1954. else
  1955. mmpostfix:=PF_IAD;}
  1956. list.concat(taicpu.op_ref_regset(A_VLDM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  1957. end;
  1958. end;
  1959. end;
  1960. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  1961. if (pi_do_call in current_procinfo.flags) or
  1962. (regs<>[]) or
  1963. ((target_info.system in systems_darwin) and
  1964. (current_procinfo.framepointer<>NR_STACK_POINTER_REG)) then
  1965. begin
  1966. exclude(regs,RS_R14);
  1967. include(regs,RS_R15);
  1968. if (target_info.system in systems_darwin) then
  1969. include(regs,RS_FRAME_POINTER_REG);
  1970. end;
  1971. if not(target_info.system in systems_darwin) then
  1972. begin
  1973. { restore saved stack pointer to SP (R13) and saved lr to PC (R15).
  1974. The saved PC came after that but is discarded, since we restore
  1975. the stack pointer }
  1976. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  1977. regs:=regs+[RS_FRAME_POINTER_REG,RS_R13,RS_R15];
  1978. end
  1979. else
  1980. begin
  1981. { restore R8-R11 already if necessary (they've been stored
  1982. before the others) }
  1983. saveregs:=regs*[RS_R8,RS_R10,RS_R11];
  1984. if saveregs<>[] then
  1985. begin
  1986. reference_reset(ref,4);
  1987. ref.index:=NR_STACK_POINTER_REG;
  1988. ref.addressmode:=AM_PREINDEXED;
  1989. for r:=RS_R8 to RS_R11 do
  1990. if r in saveregs then
  1991. inc(registerarea,4);
  1992. regs:=regs-saveregs;
  1993. end;
  1994. end;
  1995. for r:=RS_R0 to RS_R15 do
  1996. if r in regs then
  1997. inc(registerarea,4);
  1998. { reapply the stack padding reg, in case there was one, see the complimentary
  1999. comment in g_proc_entry() (KB) }
  2000. paddingreg:=tarmprocinfo(current_procinfo).stackpaddingreg;
  2001. if paddingreg < RS_R4 then
  2002. if paddingreg in regs then
  2003. internalerror(201306190)
  2004. else
  2005. begin
  2006. regs:=regs+[paddingreg];
  2007. inc(registerarea,4);
  2008. end;
  2009. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  2010. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  2011. (target_info.system in systems_darwin) then
  2012. begin
  2013. LocalSize:=current_procinfo.calc_stackframe_size;
  2014. if (LocalSize<>0) or
  2015. ((stackmisalignment<>0) and
  2016. ((pi_do_call in current_procinfo.flags) or
  2017. (po_assembler in current_procinfo.procdef.procoptions))) then
  2018. begin
  2019. if pi_estimatestacksize in current_procinfo.flags then
  2020. LocalSize:=tarmprocinfo(current_procinfo).stackframesize-registerarea
  2021. else
  2022. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  2023. if is_shifter_const(LocalSize,shift) then
  2024. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  2025. else if split_into_shifter_const(localsize, imm1, imm2) then
  2026. begin
  2027. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  2028. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  2029. end
  2030. else
  2031. begin
  2032. a_reg_alloc(list,NR_R12);
  2033. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  2034. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  2035. a_reg_dealloc(list,NR_R12);
  2036. end;
  2037. end;
  2038. if (target_info.system in systems_darwin) and
  2039. (saveregs<>[]) then
  2040. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  2041. if regs=[] then
  2042. begin
  2043. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2044. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2045. else
  2046. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2047. end
  2048. else
  2049. begin
  2050. reference_reset(ref,4);
  2051. ref.index:=NR_STACK_POINTER_REG;
  2052. ref.addressmode:=AM_PREINDEXED;
  2053. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  2054. end;
  2055. end
  2056. else
  2057. begin
  2058. { restore int registers and return }
  2059. reference_reset(ref,4);
  2060. ref.index:=NR_FRAME_POINTER_REG;
  2061. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_EA));
  2062. end;
  2063. end
  2064. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2065. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2066. else
  2067. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2068. end;
  2069. procedure tbasecgarm.g_maybe_got_init(list : TAsmList);
  2070. var
  2071. ref : treference;
  2072. l : TAsmLabel;
  2073. regs : tcpuregisterset;
  2074. r: byte;
  2075. begin
  2076. if (cs_create_pic in current_settings.moduleswitches) and
  2077. (pi_needs_got in current_procinfo.flags) and
  2078. (tf_pic_uses_got in target_info.flags) then
  2079. begin
  2080. { Procedure parametrs are not initialized at this stage.
  2081. Before GOT initialization code, allocate registers used for procedure parameters
  2082. to prevent usage of these registers for temp operations in later stages of code
  2083. generation. }
  2084. regs:=rg[R_INTREGISTER].used_in_proc;
  2085. for r:=RS_R0 to RS_R3 do
  2086. if r in regs then
  2087. a_reg_alloc(list, newreg(R_INTREGISTER,r,R_SUBWHOLE));
  2088. { Allocate scratch register R12 and use it for GOT calculations directly.
  2089. Otherwise the init code can be distorted in later stages of code generation. }
  2090. a_reg_alloc(list,NR_R12);
  2091. reference_reset(ref,4);
  2092. current_asmdata.getdatalabel(l);
  2093. cg.a_label(current_procinfo.aktlocaldata,l);
  2094. ref.symbol:=l;
  2095. ref.base:=NR_PC;
  2096. ref.symboldata:=current_procinfo.aktlocaldata.last;
  2097. list.concat(Taicpu.op_reg_ref(A_LDR,NR_R12,ref));
  2098. current_asmdata.getaddrlabel(l);
  2099. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_32bit,l,current_asmdata.RefAsmSymbol('_GLOBAL_OFFSET_TABLE_'),-8));
  2100. cg.a_label(list,l);
  2101. list.concat(Taicpu.op_reg_reg_reg(A_ADD,NR_R12,NR_PC,NR_R12));
  2102. list.concat(Taicpu.op_reg_reg(A_MOV,current_procinfo.got,NR_R12));
  2103. { Deallocate registers }
  2104. a_reg_dealloc(list,NR_R12);
  2105. for r:=RS_R3 downto RS_R0 do
  2106. if r in regs then
  2107. a_reg_dealloc(list, newreg(R_INTREGISTER,r,R_SUBWHOLE));
  2108. end;
  2109. end;
  2110. procedure tbasecgarm.a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);
  2111. var
  2112. b : byte;
  2113. tmpref : treference;
  2114. instr : taicpu;
  2115. begin
  2116. if ref.addressmode<>AM_OFFSET then
  2117. internalerror(200309071);
  2118. tmpref:=ref;
  2119. { Be sure to have a base register }
  2120. if (tmpref.base=NR_NO) then
  2121. begin
  2122. if tmpref.shiftmode<>SM_None then
  2123. internalerror(2014020702);
  2124. if tmpref.signindex<0 then
  2125. internalerror(200312023);
  2126. tmpref.base:=tmpref.index;
  2127. tmpref.index:=NR_NO;
  2128. end;
  2129. if assigned(tmpref.symbol) or
  2130. not((is_shifter_const(tmpref.offset,b)) or
  2131. (is_shifter_const(-tmpref.offset,b))
  2132. ) then
  2133. fixref(list,tmpref);
  2134. { expect a base here if there is an index }
  2135. if (tmpref.base=NR_NO) and (tmpref.index<>NR_NO) then
  2136. internalerror(200312022);
  2137. if tmpref.index<>NR_NO then
  2138. begin
  2139. if tmpref.shiftmode<>SM_None then
  2140. internalerror(200312021);
  2141. if tmpref.signindex<0 then
  2142. a_op_reg_reg_reg(list,OP_SUB,OS_ADDR,tmpref.base,tmpref.index,r)
  2143. else
  2144. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpref.base,tmpref.index,r);
  2145. if tmpref.offset<>0 then
  2146. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,r,r);
  2147. end
  2148. else
  2149. begin
  2150. if tmpref.base=NR_NO then
  2151. a_load_const_reg(list,OS_ADDR,tmpref.offset,r)
  2152. else
  2153. if tmpref.offset<>0 then
  2154. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,tmpref.base,r)
  2155. else
  2156. begin
  2157. instr:=taicpu.op_reg_reg(A_MOV,r,tmpref.base);
  2158. list.concat(instr);
  2159. add_move_instruction(instr);
  2160. end;
  2161. end;
  2162. end;
  2163. procedure tbasecgarm.fixref(list : TAsmList;var ref : treference);
  2164. var
  2165. tmpreg, tmpreg2 : tregister;
  2166. tmpref : treference;
  2167. l, piclabel : tasmlabel;
  2168. indirection_done : boolean;
  2169. begin
  2170. { absolute symbols can't be handled directly, we've to store the symbol reference
  2171. in the text segment and access it pc relative
  2172. For now, we assume that references where base or index equals to PC are already
  2173. relative, all other references are assumed to be absolute and thus they need
  2174. to be handled extra.
  2175. A proper solution would be to change refoptions to a set and store the information
  2176. if the symbol is absolute or relative there.
  2177. }
  2178. { create consts entry }
  2179. reference_reset(tmpref,4);
  2180. current_asmdata.getjumplabel(l);
  2181. cg.a_label(current_procinfo.aktlocaldata,l);
  2182. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  2183. piclabel:=nil;
  2184. tmpreg:=NR_NO;
  2185. indirection_done:=false;
  2186. if assigned(ref.symbol) then
  2187. begin
  2188. if (target_info.system=system_arm_darwin) and
  2189. (ref.symbol.bind in [AB_EXTERNAL,AB_WEAK_EXTERNAL,AB_PRIVATE_EXTERN,AB_COMMON]) then
  2190. begin
  2191. tmpreg:=g_indirect_sym_load(list,ref.symbol.name,asmsym2indsymflags(ref.symbol));
  2192. if ref.offset<>0 then
  2193. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2194. indirection_done:=true;
  2195. end
  2196. else if (cs_create_pic in current_settings.moduleswitches) then
  2197. if (tf_pic_uses_got in target_info.flags) then
  2198. current_procinfo.aktlocaldata.concat(tai_const.Create_type_sym(aitconst_got,ref.symbol))
  2199. else
  2200. begin
  2201. { ideally, we would want to generate
  2202. ldr r1, LPICConstPool
  2203. LPICLocal:
  2204. ldr/str r2,[pc,r1]
  2205. ...
  2206. LPICConstPool:
  2207. .long _globsym-(LPICLocal+8)
  2208. However, we cannot be sure that the ldr/str will follow
  2209. right after the call to fixref, so we have to load the
  2210. complete address already in a register.
  2211. }
  2212. current_asmdata.getaddrlabel(piclabel);
  2213. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_ptr,piclabel,ref.symbol,ref.offset-8));
  2214. end
  2215. else
  2216. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset))
  2217. end
  2218. else
  2219. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ref.offset));
  2220. { load consts entry }
  2221. if not indirection_done then
  2222. begin
  2223. tmpreg:=getintregister(list,OS_INT);
  2224. tmpref.symbol:=l;
  2225. tmpref.base:=NR_PC;
  2226. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2227. if (cs_create_pic in current_settings.moduleswitches) and
  2228. (tf_pic_uses_got in target_info.flags) and
  2229. assigned(ref.symbol) then
  2230. begin
  2231. reference_reset(tmpref,4);
  2232. tmpref.base:=current_procinfo.got;
  2233. tmpref.index:=tmpreg;
  2234. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2235. if ref.offset<>0 then
  2236. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2237. end;
  2238. end;
  2239. if assigned(piclabel) then
  2240. begin
  2241. cg.a_label(list,piclabel);
  2242. tmpreg2:=getaddressregister(list);
  2243. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpreg,NR_PC,tmpreg2);
  2244. tmpreg:=tmpreg2
  2245. end;
  2246. { This routine can be called with PC as base/index in case the offset
  2247. was too large to encode in a load/store. In that case, the entire
  2248. absolute expression has been re-encoded in a new constpool entry, and
  2249. we have to remove the use of PC from the original reference (the code
  2250. above made everything relative to the value loaded from the new
  2251. constpool entry) }
  2252. if is_pc(ref.base) then
  2253. ref.base:=NR_NO;
  2254. if is_pc(ref.index) then
  2255. ref.index:=NR_NO;
  2256. if (ref.base<>NR_NO) then
  2257. begin
  2258. if ref.index<>NR_NO then
  2259. begin
  2260. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  2261. ref.base:=tmpreg;
  2262. end
  2263. else
  2264. if ref.base<>NR_PC then
  2265. begin
  2266. ref.index:=tmpreg;
  2267. ref.shiftimm:=0;
  2268. ref.signindex:=1;
  2269. ref.shiftmode:=SM_None;
  2270. end
  2271. else
  2272. ref.base:=tmpreg;
  2273. end
  2274. else
  2275. ref.base:=tmpreg;
  2276. ref.offset:=0;
  2277. ref.symbol:=nil;
  2278. end;
  2279. procedure tbasecgarm.g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  2280. var
  2281. paraloc1,paraloc2,paraloc3 : TCGPara;
  2282. pd : tprocdef;
  2283. begin
  2284. pd:=search_system_proc('MOVE');
  2285. paraloc1.init;
  2286. paraloc2.init;
  2287. paraloc3.init;
  2288. paramanager.getintparaloc(pd,1,paraloc1);
  2289. paramanager.getintparaloc(pd,2,paraloc2);
  2290. paramanager.getintparaloc(pd,3,paraloc3);
  2291. a_load_const_cgpara(list,OS_SINT,len,paraloc3);
  2292. a_loadaddr_ref_cgpara(list,dest,paraloc2);
  2293. a_loadaddr_ref_cgpara(list,source,paraloc1);
  2294. paramanager.freecgpara(list,paraloc3);
  2295. paramanager.freecgpara(list,paraloc2);
  2296. paramanager.freecgpara(list,paraloc1);
  2297. alloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2298. alloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2299. a_call_name(list,'FPC_MOVE',false);
  2300. dealloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2301. dealloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2302. paraloc3.done;
  2303. paraloc2.done;
  2304. paraloc1.done;
  2305. end;
  2306. procedure tbasecgarm.g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  2307. const
  2308. maxtmpreg_arm = 10; {roozbeh: can be reduced to 8 or lower if might conflick with reserved ones,also +2 is used becouse of regs required for referencing}
  2309. maxtmpreg_thumb = 5;
  2310. var
  2311. srcref,dstref,usedtmpref,usedtmpref2:treference;
  2312. srcreg,destreg,countreg,r,tmpreg:tregister;
  2313. helpsize:aint;
  2314. copysize:byte;
  2315. cgsize:Tcgsize;
  2316. tmpregisters:array[1..maxtmpreg_arm] of tregister;
  2317. maxtmpreg,
  2318. tmpregi,tmpregi2:byte;
  2319. { will never be called with count<=4 }
  2320. procedure genloop(count : aword;size : byte);
  2321. const
  2322. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2323. var
  2324. l : tasmlabel;
  2325. begin
  2326. current_asmdata.getjumplabel(l);
  2327. if count<size then size:=1;
  2328. a_load_const_reg(list,OS_INT,count div size,countreg);
  2329. cg.a_label(list,l);
  2330. srcref.addressmode:=AM_POSTINDEXED;
  2331. dstref.addressmode:=AM_POSTINDEXED;
  2332. srcref.offset:=size;
  2333. dstref.offset:=size;
  2334. r:=getintregister(list,size2opsize[size]);
  2335. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2336. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2337. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1),PF_S));
  2338. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2339. a_jmp_flags(list,F_NE,l);
  2340. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2341. srcref.offset:=1;
  2342. dstref.offset:=1;
  2343. case count mod size of
  2344. 1:
  2345. begin
  2346. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2347. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2348. end;
  2349. 2:
  2350. if aligned then
  2351. begin
  2352. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2353. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2354. end
  2355. else
  2356. begin
  2357. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2358. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2359. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2360. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2361. end;
  2362. 3:
  2363. if aligned then
  2364. begin
  2365. srcref.offset:=2;
  2366. dstref.offset:=2;
  2367. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2368. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2369. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2370. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2371. end
  2372. else
  2373. begin
  2374. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2375. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2376. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2377. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2378. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2379. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2380. end;
  2381. end;
  2382. { keep the registers alive }
  2383. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2384. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2385. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2386. end;
  2387. { will never be called with count<=4 }
  2388. procedure genloop_thumb(count : aword;size : byte);
  2389. procedure refincofs(const ref : treference;const value : longint = 1);
  2390. begin
  2391. a_op_const_reg(list,OP_ADD,OS_ADDR,value,ref.base);
  2392. end;
  2393. const
  2394. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2395. var
  2396. l : tasmlabel;
  2397. begin
  2398. current_asmdata.getjumplabel(l);
  2399. if count<size then size:=1;
  2400. a_load_const_reg(list,OS_INT,count div size,countreg);
  2401. cg.a_label(list,l);
  2402. r:=getintregister(list,size2opsize[size]);
  2403. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2404. refincofs(srcref);
  2405. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2406. refincofs(dstref);
  2407. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2408. list.concat(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1));
  2409. a_jmp_flags(list,F_NE,l);
  2410. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2411. case count mod size of
  2412. 1:
  2413. begin
  2414. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2415. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2416. end;
  2417. 2:
  2418. if aligned then
  2419. begin
  2420. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2421. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2422. end
  2423. else
  2424. begin
  2425. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2426. refincofs(srcref);
  2427. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2428. refincofs(dstref);
  2429. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2430. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2431. end;
  2432. 3:
  2433. if aligned then
  2434. begin
  2435. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2436. refincofs(srcref,2);
  2437. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2438. refincofs(dstref,2);
  2439. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2440. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2441. end
  2442. else
  2443. begin
  2444. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2445. refincofs(srcref);
  2446. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2447. refincofs(dstref);
  2448. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2449. refincofs(srcref);
  2450. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2451. refincofs(dstref);
  2452. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2453. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2454. end;
  2455. end;
  2456. { keep the registers alive }
  2457. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2458. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2459. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2460. end;
  2461. begin
  2462. if len=0 then
  2463. exit;
  2464. if GenerateThumbCode then
  2465. maxtmpreg:=maxtmpreg_thumb
  2466. else
  2467. maxtmpreg:=maxtmpreg_arm;
  2468. helpsize:=12+maxtmpreg*4;//52 with maxtmpreg=10
  2469. dstref:=dest;
  2470. srcref:=source;
  2471. if cs_opt_size in current_settings.optimizerswitches then
  2472. helpsize:=8;
  2473. if aligned and (len=4) then
  2474. begin
  2475. tmpreg:=getintregister(list,OS_32);
  2476. a_load_ref_reg(list,OS_32,OS_32,source,tmpreg);
  2477. a_load_reg_ref(list,OS_32,OS_32,tmpreg,dest);
  2478. end
  2479. else if aligned and (len=2) then
  2480. begin
  2481. tmpreg:=getintregister(list,OS_16);
  2482. a_load_ref_reg(list,OS_16,OS_16,source,tmpreg);
  2483. a_load_reg_ref(list,OS_16,OS_16,tmpreg,dest);
  2484. end
  2485. else if (len<=helpsize) and aligned then
  2486. begin
  2487. tmpregi:=0;
  2488. srcreg:=getintregister(list,OS_ADDR);
  2489. { explicit pc relative addressing, could be
  2490. e.g. a floating point constant }
  2491. if source.base=NR_PC then
  2492. begin
  2493. { ... then we don't need a loadaddr }
  2494. srcref:=source;
  2495. end
  2496. else
  2497. begin
  2498. a_loadaddr_ref_reg(list,source,srcreg);
  2499. reference_reset_base(srcref,srcreg,0,source.alignment);
  2500. end;
  2501. while (len div 4 <> 0) and (tmpregi<maxtmpreg) do
  2502. begin
  2503. inc(tmpregi);
  2504. tmpregisters[tmpregi]:=getintregister(list,OS_32);
  2505. a_load_ref_reg(list,OS_32,OS_32,srcref,tmpregisters[tmpregi]);
  2506. inc(srcref.offset,4);
  2507. dec(len,4);
  2508. end;
  2509. destreg:=getintregister(list,OS_ADDR);
  2510. a_loadaddr_ref_reg(list,dest,destreg);
  2511. reference_reset_base(dstref,destreg,0,dest.alignment);
  2512. tmpregi2:=1;
  2513. while (tmpregi2<=tmpregi) do
  2514. begin
  2515. a_load_reg_ref(list,OS_32,OS_32,tmpregisters[tmpregi2],dstref);
  2516. inc(dstref.offset,4);
  2517. inc(tmpregi2);
  2518. end;
  2519. copysize:=4;
  2520. cgsize:=OS_32;
  2521. while len<>0 do
  2522. begin
  2523. if len<2 then
  2524. begin
  2525. copysize:=1;
  2526. cgsize:=OS_8;
  2527. end
  2528. else if len<4 then
  2529. begin
  2530. copysize:=2;
  2531. cgsize:=OS_16;
  2532. end;
  2533. dec(len,copysize);
  2534. r:=getintregister(list,cgsize);
  2535. a_load_ref_reg(list,cgsize,cgsize,srcref,r);
  2536. a_load_reg_ref(list,cgsize,cgsize,r,dstref);
  2537. inc(srcref.offset,copysize);
  2538. inc(dstref.offset,copysize);
  2539. end;{end of while}
  2540. end
  2541. else
  2542. begin
  2543. cgsize:=OS_32;
  2544. if (len<=4) then{len<=4 and not aligned}
  2545. begin
  2546. r:=getintregister(list,cgsize);
  2547. usedtmpref:=a_internal_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2548. if Len=1 then
  2549. a_load_reg_ref(list,OS_8,OS_8,r,dstref)
  2550. else
  2551. begin
  2552. tmpreg:=getintregister(list,cgsize);
  2553. usedtmpref2:=a_internal_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2554. inc(usedtmpref.offset,1);
  2555. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2556. inc(usedtmpref2.offset,1);
  2557. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2558. if len>2 then
  2559. begin
  2560. inc(usedtmpref.offset,1);
  2561. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2562. inc(usedtmpref2.offset,1);
  2563. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2564. if len>3 then
  2565. begin
  2566. inc(usedtmpref.offset,1);
  2567. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2568. inc(usedtmpref2.offset,1);
  2569. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2570. end;
  2571. end;
  2572. end;
  2573. end{end of if len<=4}
  2574. else
  2575. begin{unaligned & 4<len<helpsize **or** aligned/unaligned & len>helpsize}
  2576. destreg:=getintregister(list,OS_ADDR);
  2577. a_loadaddr_ref_reg(list,dest,destreg);
  2578. reference_reset_base(dstref,destreg,0,dest.alignment);
  2579. srcreg:=getintregister(list,OS_ADDR);
  2580. a_loadaddr_ref_reg(list,source,srcreg);
  2581. reference_reset_base(srcref,srcreg,0,source.alignment);
  2582. countreg:=getintregister(list,OS_32);
  2583. // if cs_opt_size in current_settings.optimizerswitches then
  2584. { roozbeh : it seems loading 1 byte is faster becouse of caching/fetching(?) }
  2585. {if aligned then
  2586. genloop(len,4)
  2587. else}
  2588. if GenerateThumbCode then
  2589. genloop_thumb(len,1)
  2590. else
  2591. genloop(len,1);
  2592. end;
  2593. end;
  2594. end;
  2595. procedure tbasecgarm.g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);
  2596. begin
  2597. g_concatcopy_internal(list,source,dest,len,false);
  2598. end;
  2599. procedure tbasecgarm.g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);
  2600. begin
  2601. if (source.alignment in [1,3]) or
  2602. (dest.alignment in [1,3]) then
  2603. g_concatcopy_internal(list,source,dest,len,false)
  2604. else
  2605. g_concatcopy_internal(list,source,dest,len,true);
  2606. end;
  2607. procedure tbasecgarm.g_overflowCheck(list : TAsmList;const l : tlocation;def : tdef);
  2608. var
  2609. ovloc : tlocation;
  2610. begin
  2611. ovloc.loc:=LOC_VOID;
  2612. g_overflowCheck_loc(list,l,def,ovloc);
  2613. end;
  2614. procedure tbasecgarm.g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);
  2615. var
  2616. hl : tasmlabel;
  2617. ai:TAiCpu;
  2618. hflags : tresflags;
  2619. begin
  2620. if not(cs_check_overflow in current_settings.localswitches) then
  2621. exit;
  2622. current_asmdata.getjumplabel(hl);
  2623. case ovloc.loc of
  2624. LOC_VOID:
  2625. begin
  2626. ai:=taicpu.op_sym(A_B,hl);
  2627. ai.is_jmp:=true;
  2628. if not((def.typ=pointerdef) or
  2629. ((def.typ=orddef) and
  2630. (torddef(def).ordtype in [u64bit,u16bit,u32bit,u8bit,uchar,
  2631. pasbool8,pasbool16,pasbool32,pasbool64]))) then
  2632. ai.SetCondition(C_VC)
  2633. else
  2634. if TAiCpu(List.Last).opcode in [A_RSB,A_RSC,A_SBC,A_SUB] then
  2635. ai.SetCondition(C_CS)
  2636. else
  2637. ai.SetCondition(C_CC);
  2638. list.concat(ai);
  2639. end;
  2640. LOC_FLAGS:
  2641. begin
  2642. hflags:=ovloc.resflags;
  2643. inverse_flags(hflags);
  2644. cg.a_jmp_flags(list,hflags,hl);
  2645. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2646. end;
  2647. else
  2648. internalerror(200409281);
  2649. end;
  2650. a_call_name(list,'FPC_OVERFLOW',false);
  2651. a_label(list,hl);
  2652. end;
  2653. procedure tbasecgarm.g_save_registers(list : TAsmList);
  2654. begin
  2655. { this work is done in g_proc_entry }
  2656. end;
  2657. procedure tbasecgarm.g_restore_registers(list : TAsmList);
  2658. begin
  2659. { this work is done in g_proc_exit }
  2660. end;
  2661. procedure tbasecgarm.a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  2662. var
  2663. ai : taicpu;
  2664. hlabel : TAsmLabel;
  2665. begin
  2666. if GenerateThumbCode then
  2667. begin
  2668. { the optimizer has to fix this if jump range is sufficient short }
  2669. current_asmdata.getjumplabel(hlabel);
  2670. ai:=Taicpu.Op_sym(A_B,hlabel);
  2671. ai.SetCondition(inverse_cond(OpCmp2AsmCond[cond]));
  2672. ai.is_jmp:=true;
  2673. list.concat(ai);
  2674. a_jmp_always(list,l);
  2675. a_label(list,hlabel);
  2676. end
  2677. else
  2678. begin
  2679. ai:=Taicpu.Op_sym(A_B,l);
  2680. ai.SetCondition(OpCmp2AsmCond[cond]);
  2681. ai.is_jmp:=true;
  2682. list.concat(ai);
  2683. end;
  2684. end;
  2685. function get_scalar_mm_op(fromsize,tosize : tcgsize) : tasmop;
  2686. const
  2687. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of tasmop = (
  2688. (A_VMOV,A_VCVT,A_NONE,A_NONE,A_NONE),
  2689. (A_VCVT,A_VMOV,A_NONE,A_NONE,A_NONE),
  2690. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2691. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2692. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE));
  2693. begin
  2694. result:=convertop[fromsize,tosize];
  2695. if result=A_NONE then
  2696. internalerror(200312205);
  2697. end;
  2698. function get_scalar_mm_prefix(fromsize,tosize : tcgsize) : TOpPostfix;
  2699. const
  2700. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of TOpPostfix = (
  2701. (PF_F32, PF_F32F64,PF_None,PF_None,PF_None),
  2702. (PF_F64F32,PF_F64, PF_None,PF_None,PF_None),
  2703. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2704. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2705. (PF_None, PF_None, PF_None,PF_None,PF_None));
  2706. begin
  2707. result:=convertop[fromsize,tosize];
  2708. end;
  2709. procedure tbasecgarm.a_loadmm_reg_reg(list: tasmlist; fromsize,tosize: tcgsize; reg1,reg2: tregister; shuffle: pmmshuffle);
  2710. var
  2711. instr: taicpu;
  2712. begin
  2713. if (shuffle=nil) or shufflescalar(shuffle) then
  2714. instr:=setoppostfix(taicpu.op_reg_reg(get_scalar_mm_op(tosize,fromsize),reg2,reg1),get_scalar_mm_prefix(tosize,fromsize))
  2715. else
  2716. internalerror(2009112407);
  2717. list.concat(instr);
  2718. case instr.opcode of
  2719. A_VMOV:
  2720. add_move_instruction(instr);
  2721. end;
  2722. end;
  2723. procedure tbasecgarm.a_loadmm_ref_reg(list: tasmlist; fromsize,tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  2724. var
  2725. intreg,
  2726. tmpmmreg : tregister;
  2727. reg64 : tregister64;
  2728. begin
  2729. if assigned(shuffle) and
  2730. not(shufflescalar(shuffle)) then
  2731. internalerror(2009112413);
  2732. case fromsize of
  2733. OS_32,OS_S32:
  2734. begin
  2735. fromsize:=OS_F32;
  2736. { since we are loading an integer, no conversion may be required }
  2737. if (fromsize<>tosize) then
  2738. internalerror(2009112801);
  2739. end;
  2740. OS_64,OS_S64:
  2741. begin
  2742. fromsize:=OS_F64;
  2743. { since we are loading an integer, no conversion may be required }
  2744. if (fromsize<>tosize) then
  2745. internalerror(2009112901);
  2746. end;
  2747. end;
  2748. if (fromsize<>tosize) then
  2749. tmpmmreg:=getmmregister(list,fromsize)
  2750. else
  2751. tmpmmreg:=reg;
  2752. if (ref.alignment in [1,2]) then
  2753. begin
  2754. case fromsize of
  2755. OS_F32:
  2756. begin
  2757. intreg:=getintregister(list,OS_32);
  2758. a_load_ref_reg(list,OS_32,OS_32,ref,intreg);
  2759. a_loadmm_intreg_reg(list,OS_32,OS_F32,intreg,tmpmmreg,mms_movescalar);
  2760. end;
  2761. OS_F64:
  2762. begin
  2763. reg64.reglo:=getintregister(list,OS_32);
  2764. reg64.reghi:=getintregister(list,OS_32);
  2765. cg64.a_load64_ref_reg(list,ref,reg64);
  2766. cg64.a_loadmm_intreg64_reg(list,OS_F64,reg64,tmpmmreg);
  2767. end;
  2768. else
  2769. internalerror(2009112412);
  2770. end;
  2771. end
  2772. else
  2773. begin
  2774. handle_load_store(list,A_VLDR,PF_None,tmpmmreg,ref);
  2775. end;
  2776. if (tmpmmreg<>reg) then
  2777. a_loadmm_reg_reg(list,fromsize,tosize,tmpmmreg,reg,shuffle);
  2778. end;
  2779. procedure tbasecgarm.a_loadmm_reg_ref(list: tasmlist; fromsize,tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  2780. var
  2781. intreg,
  2782. tmpmmreg : tregister;
  2783. reg64 : tregister64;
  2784. begin
  2785. if assigned(shuffle) and
  2786. not(shufflescalar(shuffle)) then
  2787. internalerror(2009112416);
  2788. case tosize of
  2789. OS_32,OS_S32:
  2790. begin
  2791. tosize:=OS_F32;
  2792. { since we are loading an integer, no conversion may be required }
  2793. if (fromsize<>tosize) then
  2794. internalerror(2009112801);
  2795. end;
  2796. OS_64,OS_S64:
  2797. begin
  2798. tosize:=OS_F64;
  2799. { since we are loading an integer, no conversion may be required }
  2800. if (fromsize<>tosize) then
  2801. internalerror(2009112901);
  2802. end;
  2803. end;
  2804. if (fromsize<>tosize) then
  2805. begin
  2806. tmpmmreg:=getmmregister(list,tosize);
  2807. a_loadmm_reg_reg(list,fromsize,tosize,reg,tmpmmreg,shuffle);
  2808. end
  2809. else
  2810. tmpmmreg:=reg;
  2811. if (ref.alignment in [1,2]) then
  2812. begin
  2813. case tosize of
  2814. OS_F32:
  2815. begin
  2816. intreg:=getintregister(list,OS_32);
  2817. a_loadmm_reg_intreg(list,OS_F32,OS_32,tmpmmreg,intreg,shuffle);
  2818. a_load_reg_ref(list,OS_32,OS_32,intreg,ref);
  2819. end;
  2820. OS_F64:
  2821. begin
  2822. reg64.reglo:=getintregister(list,OS_32);
  2823. reg64.reghi:=getintregister(list,OS_32);
  2824. cg64.a_loadmm_reg_intreg64(list,OS_F64,tmpmmreg,reg64);
  2825. cg64.a_load64_reg_ref(list,reg64,ref);
  2826. end;
  2827. else
  2828. internalerror(2009112417);
  2829. end;
  2830. end
  2831. else
  2832. begin
  2833. handle_load_store(list,A_VSTR,PF_None,tmpmmreg,ref);
  2834. end;
  2835. end;
  2836. procedure tbasecgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  2837. begin
  2838. { this code can only be used to transfer raw data, not to perform
  2839. conversions }
  2840. if (tosize<>OS_F32) then
  2841. internalerror(2009112419);
  2842. if not(fromsize in [OS_32,OS_S32]) then
  2843. internalerror(2009112420);
  2844. if assigned(shuffle) and
  2845. not shufflescalar(shuffle) then
  2846. internalerror(2009112516);
  2847. list.concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg));
  2848. end;
  2849. procedure tbasecgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize; mmreg, intreg: tregister;shuffle : pmmshuffle);
  2850. begin
  2851. { this code can only be used to transfer raw data, not to perform
  2852. conversions }
  2853. if (fromsize<>OS_F32) then
  2854. internalerror(2009112430);
  2855. if not(tosize in [OS_32,OS_S32]) then
  2856. internalerror(2009112420);
  2857. if assigned(shuffle) and
  2858. not shufflescalar(shuffle) then
  2859. internalerror(2009112514);
  2860. list.concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg));
  2861. end;
  2862. procedure tbasecgarm.a_opmm_reg_reg(list: tasmlist; op: topcg; size: tcgsize; src, dst: tregister; shuffle: pmmshuffle);
  2863. var
  2864. tmpreg: tregister;
  2865. begin
  2866. { the vfp doesn't support xor nor any other logical operation, but
  2867. this routine is used to initialise global mm regvars. We can
  2868. easily initialise an mm reg with 0 though. }
  2869. case op of
  2870. OP_XOR:
  2871. begin
  2872. if (src<>dst) or
  2873. (reg_cgsize(src)<>size) or
  2874. assigned(shuffle) then
  2875. internalerror(2009112907);
  2876. tmpreg:=getintregister(list,OS_32);
  2877. a_load_const_reg(list,OS_32,0,tmpreg);
  2878. case size of
  2879. OS_F32:
  2880. list.concat(taicpu.op_reg_reg(A_VMOV,dst,tmpreg));
  2881. OS_F64:
  2882. list.concat(taicpu.op_reg_reg_reg(A_VMOV,dst,tmpreg,tmpreg));
  2883. else
  2884. internalerror(2009112908);
  2885. end;
  2886. end
  2887. else
  2888. internalerror(2009112906);
  2889. end;
  2890. end;
  2891. procedure tbasecgarm.g_intf_wrapper(list: TAsmList; procdef: tprocdef; const labelname: string; ioffset: longint);
  2892. procedure loadvmttor12;
  2893. var
  2894. tmpref,
  2895. href : treference;
  2896. extrareg : boolean;
  2897. l : TAsmLabel;
  2898. begin
  2899. reference_reset_base(href,NR_R0,0,sizeof(pint));
  2900. if GenerateThumbCode then
  2901. begin
  2902. if (href.offset in [0..124]) and ((href.offset mod 4)=0) then
  2903. begin
  2904. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R0]));
  2905. cg.a_load_ref_reg(list,OS_ADDR,OS_ADDR,href,NR_R0);
  2906. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_R0));
  2907. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R0]));
  2908. end
  2909. else
  2910. begin
  2911. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R0,RS_R1]));
  2912. { create consts entry }
  2913. reference_reset(tmpref,4);
  2914. current_asmdata.getjumplabel(l);
  2915. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  2916. cg.a_label(current_procinfo.aktlocaldata,l);
  2917. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  2918. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(href.offset));
  2919. tmpref.symbol:=l;
  2920. tmpref.base:=NR_PC;
  2921. list.concat(taicpu.op_reg_ref(A_LDR,NR_R1,tmpref));
  2922. href.offset:=0;
  2923. href.index:=NR_R1;
  2924. cg.a_load_ref_reg(list,OS_ADDR,OS_ADDR,href,NR_R0);
  2925. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_R0));
  2926. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R0,RS_R1]));
  2927. end;
  2928. end
  2929. else
  2930. cg.a_load_ref_reg(list,OS_ADDR,OS_ADDR,href,NR_R12);
  2931. end;
  2932. procedure op_onr12methodaddr;
  2933. var
  2934. tmpref,
  2935. href : treference;
  2936. l : TAsmLabel;
  2937. begin
  2938. if (procdef.extnumber=$ffff) then
  2939. Internalerror(200006139);
  2940. if GenerateThumbCode then
  2941. begin
  2942. reference_reset_base(href,NR_R0,tobjectdef(procdef.struct).vmtmethodoffset(procdef.extnumber),sizeof(pint));
  2943. if (href.offset in [0..124]) and ((href.offset mod 4)=0) then
  2944. begin
  2945. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R0]));
  2946. list.concat(taicpu.op_reg_reg(A_MOV,NR_R0,NR_R12));
  2947. cg.a_load_ref_reg(list,OS_ADDR,OS_ADDR,href,NR_R0);
  2948. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_R0));
  2949. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R0]));
  2950. end
  2951. else
  2952. begin
  2953. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R0,RS_R1]));
  2954. { create consts entry }
  2955. reference_reset(tmpref,4);
  2956. current_asmdata.getjumplabel(l);
  2957. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  2958. cg.a_label(current_procinfo.aktlocaldata,l);
  2959. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  2960. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(href.offset));
  2961. tmpref.symbol:=l;
  2962. tmpref.base:=NR_PC;
  2963. list.concat(taicpu.op_reg_ref(A_LDR,NR_R1,tmpref));
  2964. list.concat(taicpu.op_reg_reg(A_MOV,NR_R0,NR_R12));
  2965. href.offset:=0;
  2966. href.base:=NR_R0;
  2967. href.index:=NR_R1;
  2968. cg.a_load_ref_reg(list,OS_ADDR,OS_ADDR,href,NR_R0);
  2969. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_R0));
  2970. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R0,RS_R1]));
  2971. end;
  2972. end
  2973. else
  2974. begin
  2975. reference_reset_base(href,NR_R12,tobjectdef(procdef.struct).vmtmethodoffset(procdef.extnumber),sizeof(pint));
  2976. cg.a_load_ref_reg(list,OS_ADDR,OS_ADDR,href,NR_R12);
  2977. end;
  2978. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2979. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R12))
  2980. else
  2981. list.concat(taicpu.op_reg(A_BX,NR_R12));
  2982. end;
  2983. var
  2984. make_global : boolean;
  2985. tmpref : treference;
  2986. l : TAsmLabel;
  2987. begin
  2988. if not(procdef.proctypeoption in [potype_function,potype_procedure]) then
  2989. Internalerror(200006137);
  2990. if not assigned(procdef.struct) or
  2991. (procdef.procoptions*[po_classmethod, po_staticmethod,
  2992. po_methodpointer, po_interrupt, po_iocheck]<>[]) then
  2993. Internalerror(200006138);
  2994. if procdef.owner.symtabletype<>ObjectSymtable then
  2995. Internalerror(200109191);
  2996. if GenerateThumbCode or GenerateThumb2Code then
  2997. list.concat(tai_directive.Create(asd_thumb_func,''));
  2998. make_global:=false;
  2999. if (not current_module.is_unit) or
  3000. create_smartlink or
  3001. (procdef.owner.defowner.owner.symtabletype=globalsymtable) then
  3002. make_global:=true;
  3003. if make_global then
  3004. list.concat(Tai_symbol.Createname_global(labelname,AT_FUNCTION,0))
  3005. else
  3006. list.concat(Tai_symbol.Createname(labelname,AT_FUNCTION,0));
  3007. { the wrapper might need aktlocaldata for the additional data to
  3008. load the constant }
  3009. current_procinfo:=cprocinfo.create(nil);
  3010. { set param1 interface to self }
  3011. g_adjust_self_value(list,procdef,ioffset);
  3012. { case 4 }
  3013. if (po_virtualmethod in procdef.procoptions) and
  3014. not is_objectpascal_helper(procdef.struct) then
  3015. begin
  3016. loadvmttor12;
  3017. op_onr12methodaddr;
  3018. end
  3019. { case 0 }
  3020. else if GenerateThumbCode then
  3021. begin
  3022. { bl cannot be used here because it destroys lr }
  3023. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R0]));
  3024. { create consts entry }
  3025. reference_reset(tmpref,4);
  3026. current_asmdata.getjumplabel(l);
  3027. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3028. cg.a_label(current_procinfo.aktlocaldata,l);
  3029. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3030. current_procinfo.aktlocaldata.concat(tai_const.Create_sym(current_asmdata.RefAsmSymbol(procdef.mangledname)));
  3031. tmpref.symbol:=l;
  3032. tmpref.base:=NR_PC;
  3033. cg.a_load_ref_reg(list,OS_ADDR,OS_ADDR,tmpref,NR_R0);
  3034. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_R0));
  3035. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R0]));
  3036. list.concat(taicpu.op_reg(A_BX,NR_R12));
  3037. end
  3038. else
  3039. list.concat(taicpu.op_sym(A_B,current_asmdata.RefAsmSymbol(procdef.mangledname)));
  3040. list.concatlist(current_procinfo.aktlocaldata);
  3041. current_procinfo.Free;
  3042. current_procinfo:=nil;
  3043. list.concat(Tai_symbol_end.Createname(labelname));
  3044. end;
  3045. procedure tbasecgarm.maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  3046. const
  3047. overflowops = [OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NEG];
  3048. begin
  3049. if (op in overflowops) and
  3050. (size in [OS_8,OS_S8,OS_16,OS_S16]) then
  3051. a_load_reg_reg(list,OS_32,size,dst,dst);
  3052. end;
  3053. procedure tbasecgarm.safe_mla(list : TAsmList; op1,op2,op3,op4 : TRegister);
  3054. procedure checkreg(var reg : TRegister);
  3055. var
  3056. tmpreg : TRegister;
  3057. begin
  3058. if ((GenerateThumbCode or GenerateThumb2Code) and (getsupreg(reg)=RS_R13)) or
  3059. (getsupreg(reg)=RS_R15) then
  3060. begin
  3061. tmpreg:=getintregister(list,OS_INT);
  3062. a_load_reg_reg(list,OS_INT,OS_INT,reg,tmpreg);
  3063. reg:=tmpreg;
  3064. end;
  3065. end;
  3066. begin
  3067. checkreg(op1);
  3068. checkreg(op2);
  3069. checkreg(op3);
  3070. checkreg(op4);
  3071. list.concat(taicpu.op_reg_reg_reg_reg(A_MLA,op1,op2,op3,op4));
  3072. end;
  3073. procedure tcg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  3074. begin
  3075. case op of
  3076. OP_NEG:
  3077. begin
  3078. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3079. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  3080. list.concat(taicpu.op_reg_reg_const(A_RSC,regdst.reghi,regsrc.reghi,0));
  3081. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3082. end;
  3083. OP_NOT:
  3084. begin
  3085. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  3086. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  3087. end;
  3088. else
  3089. a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);
  3090. end;
  3091. end;
  3092. procedure tcg64farm.a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);
  3093. begin
  3094. a_op64_const_reg_reg(list,op,size,value,reg,reg);
  3095. end;
  3096. procedure tcg64farm.a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);
  3097. var
  3098. ovloc : tlocation;
  3099. begin
  3100. a_op64_const_reg_reg_checkoverflow(list,op,size,value,regsrc,regdst,false,ovloc);
  3101. end;
  3102. procedure tcg64farm.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);
  3103. var
  3104. ovloc : tlocation;
  3105. begin
  3106. a_op64_reg_reg_reg_checkoverflow(list,op,size,regsrc1,regsrc2,regdst,false,ovloc);
  3107. end;
  3108. procedure tcg64farm.a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);
  3109. begin
  3110. { this code can only be used to transfer raw data, not to perform
  3111. conversions }
  3112. if (mmsize<>OS_F64) then
  3113. internalerror(2009112405);
  3114. list.concat(taicpu.op_reg_reg_reg(A_VMOV,mmreg,intreg.reglo,intreg.reghi));
  3115. end;
  3116. procedure tcg64farm.a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);
  3117. begin
  3118. { this code can only be used to transfer raw data, not to perform
  3119. conversions }
  3120. if (mmsize<>OS_F64) then
  3121. internalerror(2009112406);
  3122. list.concat(taicpu.op_reg_reg_reg(A_VMOV,intreg.reglo,intreg.reghi,mmreg));
  3123. end;
  3124. procedure tcg64farm.a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3125. var
  3126. tmpreg : tregister;
  3127. b : byte;
  3128. begin
  3129. ovloc.loc:=LOC_VOID;
  3130. case op of
  3131. OP_NEG,
  3132. OP_NOT :
  3133. internalerror(2012022501);
  3134. end;
  3135. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3136. begin
  3137. case op of
  3138. OP_ADD:
  3139. begin
  3140. if is_shifter_const(lo(value),b) then
  3141. begin
  3142. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3143. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3144. end
  3145. else
  3146. begin
  3147. tmpreg:=cg.getintregister(list,OS_32);
  3148. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3149. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3150. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3151. end;
  3152. if is_shifter_const(hi(value),b) then
  3153. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,hi(value)),PF_S))
  3154. else
  3155. begin
  3156. tmpreg:=cg.getintregister(list,OS_32);
  3157. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3158. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3159. end;
  3160. end;
  3161. OP_SUB:
  3162. begin
  3163. if is_shifter_const(lo(value),b) then
  3164. begin
  3165. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3166. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3167. end
  3168. else
  3169. begin
  3170. tmpreg:=cg.getintregister(list,OS_32);
  3171. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3172. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3173. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3174. end;
  3175. if is_shifter_const(hi(value),b) then
  3176. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))),PF_S))
  3177. else
  3178. begin
  3179. tmpreg:=cg.getintregister(list,OS_32);
  3180. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3181. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3182. end;
  3183. end;
  3184. else
  3185. internalerror(200502131);
  3186. end;
  3187. if size=OS_64 then
  3188. begin
  3189. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3190. ovloc.loc:=LOC_FLAGS;
  3191. case op of
  3192. OP_ADD:
  3193. ovloc.resflags:=F_CS;
  3194. OP_SUB:
  3195. ovloc.resflags:=F_CC;
  3196. end;
  3197. end;
  3198. end
  3199. else
  3200. begin
  3201. case op of
  3202. OP_AND,OP_OR,OP_XOR:
  3203. begin
  3204. cg.a_op_const_reg_reg(list,op,OS_32,aint(lo(value)),regsrc.reglo,regdst.reglo);
  3205. cg.a_op_const_reg_reg(list,op,OS_32,aint(hi(value)),regsrc.reghi,regdst.reghi);
  3206. end;
  3207. OP_ADD:
  3208. begin
  3209. if is_shifter_const(aint(lo(value)),b) then
  3210. begin
  3211. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3212. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3213. end
  3214. else
  3215. begin
  3216. tmpreg:=cg.getintregister(list,OS_32);
  3217. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3218. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3219. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3220. end;
  3221. if is_shifter_const(aint(hi(value)),b) then
  3222. list.concat(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3223. else
  3224. begin
  3225. tmpreg:=cg.getintregister(list,OS_32);
  3226. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  3227. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg));
  3228. end;
  3229. end;
  3230. OP_SUB:
  3231. begin
  3232. if is_shifter_const(aint(lo(value)),b) then
  3233. begin
  3234. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3235. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3236. end
  3237. else
  3238. begin
  3239. tmpreg:=cg.getintregister(list,OS_32);
  3240. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3241. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3242. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3243. end;
  3244. if is_shifter_const(aint(hi(value)),b) then
  3245. list.concat(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3246. else
  3247. begin
  3248. tmpreg:=cg.getintregister(list,OS_32);
  3249. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3250. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg));
  3251. end;
  3252. end;
  3253. else
  3254. internalerror(2003083101);
  3255. end;
  3256. end;
  3257. end;
  3258. procedure tcg64farm.a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3259. begin
  3260. ovloc.loc:=LOC_VOID;
  3261. case op of
  3262. OP_NEG,
  3263. OP_NOT :
  3264. internalerror(2012022502);
  3265. end;
  3266. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3267. begin
  3268. case op of
  3269. OP_ADD:
  3270. begin
  3271. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3272. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3273. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi),PF_S));
  3274. end;
  3275. OP_SUB:
  3276. begin
  3277. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3278. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3279. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi),PF_S));
  3280. end;
  3281. else
  3282. internalerror(2003083101);
  3283. end;
  3284. if size=OS_64 then
  3285. begin
  3286. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3287. ovloc.loc:=LOC_FLAGS;
  3288. case op of
  3289. OP_ADD:
  3290. ovloc.resflags:=F_CS;
  3291. OP_SUB:
  3292. ovloc.resflags:=F_CC;
  3293. end;
  3294. end;
  3295. end
  3296. else
  3297. begin
  3298. case op of
  3299. OP_AND,OP_OR,OP_XOR:
  3300. begin
  3301. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);
  3302. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);
  3303. end;
  3304. OP_ADD:
  3305. begin
  3306. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3307. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3308. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi));
  3309. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3310. end;
  3311. OP_SUB:
  3312. begin
  3313. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3314. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3315. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi));
  3316. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3317. end;
  3318. else
  3319. internalerror(2003083101);
  3320. end;
  3321. end;
  3322. end;
  3323. procedure tthumbcgarm.init_register_allocators;
  3324. begin
  3325. inherited init_register_allocators;
  3326. if assigned(current_procinfo) and (current_procinfo.framepointer=NR_R7) then
  3327. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3328. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6],first_int_imreg,[])
  3329. else
  3330. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3331. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7],first_int_imreg,[]);
  3332. end;
  3333. procedure tthumbcgarm.done_register_allocators;
  3334. begin
  3335. rg[R_INTREGISTER].free;
  3336. rg[R_FPUREGISTER].free;
  3337. rg[R_MMREGISTER].free;
  3338. inherited done_register_allocators;
  3339. end;
  3340. procedure tthumbcgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  3341. var
  3342. ref : treference;
  3343. shift : byte;
  3344. r : byte;
  3345. regs, saveregs : tcpuregisterset;
  3346. r7offset,
  3347. stackmisalignment : pint;
  3348. postfix: toppostfix;
  3349. registerarea,
  3350. imm1, imm2: DWord;
  3351. stack_parameters: Boolean;
  3352. begin
  3353. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3354. LocalSize:=align(LocalSize,4);
  3355. { call instruction does not put anything on the stack }
  3356. stackmisalignment:=0;
  3357. if not(nostackframe) then
  3358. begin
  3359. a_reg_alloc(list,NR_STACK_POINTER_REG);
  3360. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3361. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  3362. { save int registers }
  3363. reference_reset(ref,4);
  3364. ref.index:=NR_STACK_POINTER_REG;
  3365. ref.addressmode:=AM_PREINDEXED;
  3366. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3367. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3368. begin
  3369. //!!!! a_reg_alloc(list,NR_R12);
  3370. //!!!! list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  3371. end;
  3372. { the (old) ARM APCS requires saving both the stack pointer (to
  3373. crawl the stack) and the PC (to identify the function this
  3374. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  3375. and R15 -- still needs updating for EABI and Darwin, they don't
  3376. need that }
  3377. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3378. regs:=regs+[RS_R7,RS_R14]
  3379. else
  3380. // if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  3381. include(regs,RS_R14);
  3382. { safely estimate stack size }
  3383. if localsize+current_settings.alignment.localalignmax+4>508 then
  3384. begin
  3385. include(rg[R_INTREGISTER].used_in_proc,RS_R4);
  3386. include(regs,RS_R4);
  3387. end;
  3388. registerarea:=0;
  3389. if regs<>[] then
  3390. begin
  3391. for r:=RS_R0 to RS_R15 do
  3392. if r in regs then
  3393. inc(registerarea,4);
  3394. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,regs));
  3395. end;
  3396. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3397. if stack_parameters or (LocalSize<>0) or
  3398. ((stackmisalignment<>0) and
  3399. ((pi_do_call in current_procinfo.flags) or
  3400. (po_assembler in current_procinfo.procdef.procoptions))) then
  3401. begin
  3402. { do we access stack parameters?
  3403. if yes, the previously estimated stacksize must be used }
  3404. if stack_parameters then
  3405. begin
  3406. if localsize>tarmprocinfo(current_procinfo).stackframesize then
  3407. begin
  3408. writeln(localsize);
  3409. writeln(tarmprocinfo(current_procinfo).stackframesize);
  3410. internalerror(2013040601);
  3411. end
  3412. else
  3413. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea;
  3414. end
  3415. else
  3416. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3417. if localsize<508 then
  3418. begin
  3419. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  3420. end
  3421. else if localsize<=1016 then
  3422. begin
  3423. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3424. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize-508));
  3425. end
  3426. else
  3427. begin
  3428. a_load_const_reg(list,OS_ADDR,-localsize,NR_R4);
  3429. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R4));
  3430. include(regs,RS_R4);
  3431. //!!!! if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  3432. //!!!! a_reg_alloc(list,NR_R12);
  3433. //!!!! a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  3434. //!!!! list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  3435. //!!!! a_reg_dealloc(list,NR_R12);
  3436. end;
  3437. end;
  3438. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3439. begin
  3440. list.concat(taicpu.op_reg_reg_const(A_ADD,current_procinfo.framepointer,NR_STACK_POINTER_REG,0));
  3441. end;
  3442. end;
  3443. end;
  3444. procedure tthumbcgarm.g_proc_exit(list: TAsmList; parasize: longint; nostackframe: boolean);
  3445. var
  3446. ref : treference;
  3447. LocalSize : longint;
  3448. r,
  3449. shift : byte;
  3450. saveregs,
  3451. regs : tcpuregisterset;
  3452. registerarea : DWord;
  3453. stackmisalignment: pint;
  3454. imm1, imm2: DWord;
  3455. stack_parameters : Boolean;
  3456. begin
  3457. if not(nostackframe) then
  3458. begin
  3459. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3460. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3461. include(regs,RS_R15);
  3462. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3463. include(regs,getsupreg(current_procinfo.framepointer));
  3464. registerarea:=0;
  3465. for r:=RS_R0 to RS_R15 do
  3466. if r in regs then
  3467. inc(registerarea,4);
  3468. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3469. LocalSize:=current_procinfo.calc_stackframe_size;
  3470. if stack_parameters then
  3471. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea
  3472. else
  3473. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3474. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  3475. (target_info.system in systems_darwin) then
  3476. begin
  3477. if (LocalSize<>0) or
  3478. ((stackmisalignment<>0) and
  3479. ((pi_do_call in current_procinfo.flags) or
  3480. (po_assembler in current_procinfo.procdef.procoptions))) then
  3481. begin
  3482. if LocalSize=0 then
  3483. else if LocalSize<=508 then
  3484. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  3485. else if LocalSize<=1016 then
  3486. begin
  3487. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3488. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,localsize-508));
  3489. end
  3490. else
  3491. begin
  3492. a_reg_alloc(list,NR_R3);
  3493. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R3);
  3494. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R3));
  3495. a_reg_dealloc(list,NR_R3);
  3496. end;
  3497. end;
  3498. if regs=[] then
  3499. begin
  3500. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3501. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3502. else
  3503. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3504. end
  3505. else
  3506. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,regs));
  3507. end;
  3508. end
  3509. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3510. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3511. else
  3512. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3513. end;
  3514. procedure tthumbcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3515. var
  3516. oppostfix:toppostfix;
  3517. usedtmpref: treference;
  3518. tmpreg,tmpreg2 : tregister;
  3519. dir : integer;
  3520. begin
  3521. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3522. FromSize := ToSize;
  3523. case FromSize of
  3524. { signed integer registers }
  3525. OS_8:
  3526. oppostfix:=PF_B;
  3527. OS_S8:
  3528. oppostfix:=PF_SB;
  3529. OS_16:
  3530. oppostfix:=PF_H;
  3531. OS_S16:
  3532. oppostfix:=PF_SH;
  3533. OS_32,
  3534. OS_S32:
  3535. oppostfix:=PF_None;
  3536. else
  3537. InternalError(200308298);
  3538. end;
  3539. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3540. begin
  3541. if target_info.endian=endian_big then
  3542. dir:=-1
  3543. else
  3544. dir:=1;
  3545. case FromSize of
  3546. OS_16,OS_S16:
  3547. begin
  3548. { only complicated references need an extra loadaddr }
  3549. if assigned(ref.symbol) or
  3550. (ref.index<>NR_NO) or
  3551. (ref.offset<-124) or
  3552. (ref.offset>124) or
  3553. { sometimes the compiler reused registers }
  3554. (reg=ref.index) or
  3555. (reg=ref.base) then
  3556. begin
  3557. tmpreg2:=getintregister(list,OS_INT);
  3558. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3559. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3560. end
  3561. else
  3562. usedtmpref:=ref;
  3563. if target_info.endian=endian_big then
  3564. inc(usedtmpref.offset,1);
  3565. tmpreg:=getintregister(list,OS_INT);
  3566. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3567. inc(usedtmpref.offset,dir);
  3568. if FromSize=OS_16 then
  3569. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3570. else
  3571. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3572. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3573. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3574. end;
  3575. OS_32,OS_S32:
  3576. begin
  3577. tmpreg:=getintregister(list,OS_INT);
  3578. { only complicated references need an extra loadaddr }
  3579. if assigned(ref.symbol) or
  3580. (ref.index<>NR_NO) or
  3581. (ref.offset<-124) or
  3582. (ref.offset>124) or
  3583. { sometimes the compiler reused registers }
  3584. (reg=ref.index) or
  3585. (reg=ref.base) then
  3586. begin
  3587. tmpreg2:=getintregister(list,OS_INT);
  3588. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3589. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3590. end
  3591. else
  3592. usedtmpref:=ref;
  3593. if ref.alignment=2 then
  3594. begin
  3595. if target_info.endian=endian_big then
  3596. inc(usedtmpref.offset,2);
  3597. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  3598. inc(usedtmpref.offset,dir*2);
  3599. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  3600. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3601. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3602. end
  3603. else
  3604. begin
  3605. if target_info.endian=endian_big then
  3606. inc(usedtmpref.offset,3);
  3607. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3608. inc(usedtmpref.offset,dir);
  3609. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3610. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3611. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3612. inc(usedtmpref.offset,dir);
  3613. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3614. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3615. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3616. inc(usedtmpref.offset,dir);
  3617. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3618. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,24));
  3619. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3620. end;
  3621. end
  3622. else
  3623. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3624. end;
  3625. end
  3626. else
  3627. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3628. if (fromsize=OS_S8) and (tosize = OS_16) then
  3629. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  3630. end;
  3631. procedure tthumbcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3632. var
  3633. imm_shift : byte;
  3634. l : tasmlabel;
  3635. hr : treference;
  3636. begin
  3637. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3638. internalerror(2002090902);
  3639. if is_thumb_imm(a) then
  3640. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3641. else
  3642. begin
  3643. reference_reset(hr,4);
  3644. current_asmdata.getjumplabel(l);
  3645. cg.a_label(current_procinfo.aktlocaldata,l);
  3646. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3647. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3648. hr.symbol:=l;
  3649. hr.base:=NR_PC;
  3650. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3651. end;
  3652. end;
  3653. procedure tthumbcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  3654. var
  3655. hsym : tsym;
  3656. href,
  3657. tmpref : treference;
  3658. paraloc : Pcgparalocation;
  3659. l : TAsmLabel;
  3660. begin
  3661. { calculate the parameter info for the procdef }
  3662. procdef.init_paraloc_info(callerside);
  3663. hsym:=tsym(procdef.parast.Find('self'));
  3664. if not(assigned(hsym) and
  3665. (hsym.typ=paravarsym)) then
  3666. internalerror(200305251);
  3667. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  3668. while paraloc<>nil do
  3669. with paraloc^ do
  3670. begin
  3671. case loc of
  3672. LOC_REGISTER:
  3673. begin
  3674. if is_thumb_imm(ioffset) then
  3675. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  3676. else
  3677. begin
  3678. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3679. reference_reset(tmpref,4);
  3680. current_asmdata.getjumplabel(l);
  3681. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3682. cg.a_label(current_procinfo.aktlocaldata,l);
  3683. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3684. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3685. tmpref.symbol:=l;
  3686. tmpref.base:=NR_PC;
  3687. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3688. a_op_reg_reg(list,OP_SUB,size,NR_R4,register);
  3689. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3690. end;
  3691. end;
  3692. LOC_REFERENCE:
  3693. begin
  3694. { offset in the wrapper needs to be adjusted for the stored
  3695. return address }
  3696. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),sizeof(pint));
  3697. if is_thumb_imm(ioffset) then
  3698. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  3699. else
  3700. begin
  3701. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3702. reference_reset(tmpref,4);
  3703. current_asmdata.getjumplabel(l);
  3704. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3705. cg.a_label(current_procinfo.aktlocaldata,l);
  3706. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3707. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3708. tmpref.symbol:=l;
  3709. tmpref.base:=NR_PC;
  3710. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3711. a_op_reg_ref(list,OP_SUB,size,NR_R4,href);
  3712. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3713. end;
  3714. end
  3715. else
  3716. internalerror(200309189);
  3717. end;
  3718. paraloc:=next;
  3719. end;
  3720. end;
  3721. function tthumbcgarm.handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference;
  3722. var
  3723. href : treference;
  3724. tmpreg : TRegister;
  3725. begin
  3726. href:=ref;
  3727. if { LDR/STR limitations }
  3728. (
  3729. (((op=A_LDR) and (oppostfix=PF_None)) or
  3730. ((op=A_STR) and (oppostfix=PF_None))) and
  3731. (ref.base<>NR_STACK_POINTER_REG) and
  3732. (abs(ref.offset)>124)
  3733. ) or
  3734. { LDRB/STRB limitations }
  3735. (
  3736. (((op=A_LDR) and (oppostfix=PF_B)) or
  3737. ((op=A_LDRB) and (oppostfix=PF_None)) or
  3738. ((op=A_STR) and (oppostfix=PF_B)) or
  3739. ((op=A_STRB) and (oppostfix=PF_None))) and
  3740. ((ref.base=NR_STACK_POINTER_REG) or
  3741. (ref.index=NR_STACK_POINTER_REG) or
  3742. (abs(ref.offset)>31)
  3743. )
  3744. ) or
  3745. { LDRH/STRH limitations }
  3746. (
  3747. (((op=A_LDR) and (oppostfix=PF_H)) or
  3748. ((op=A_LDRH) and (oppostfix=PF_None)) or
  3749. ((op=A_STR) and (oppostfix=PF_H)) or
  3750. ((op=A_STRH) and (oppostfix=PF_None))) and
  3751. ((ref.base=NR_STACK_POINTER_REG) or
  3752. (ref.index=NR_STACK_POINTER_REG) or
  3753. (abs(ref.offset)>62) or
  3754. ((abs(ref.offset) mod 2)<>0)
  3755. )
  3756. ) then
  3757. begin
  3758. tmpreg:=getintregister(list,OS_ADDR);
  3759. a_loadaddr_ref_reg(list,ref,tmpreg);
  3760. reference_reset_base(href,tmpreg,0,ref.alignment);
  3761. end
  3762. else if (op=A_LDR) and
  3763. (oppostfix in [PF_None]) and
  3764. (ref.base=NR_STACK_POINTER_REG) and
  3765. (abs(ref.offset)>1020) then
  3766. begin
  3767. tmpreg:=getintregister(list,OS_ADDR);
  3768. a_loadaddr_ref_reg(list,ref,tmpreg);
  3769. reference_reset_base(href,tmpreg,0,ref.alignment);
  3770. end
  3771. else if (op=A_LDR) and
  3772. ((oppostfix in [PF_SH,PF_SB]) or
  3773. (abs(ref.offset)>124)) then
  3774. begin
  3775. tmpreg:=getintregister(list,OS_ADDR);
  3776. a_loadaddr_ref_reg(list,ref,tmpreg);
  3777. reference_reset_base(href,tmpreg,0,ref.alignment);
  3778. end;
  3779. Result:=inherited handle_load_store(list, op, oppostfix, reg, href);
  3780. end;
  3781. procedure tthumbcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  3782. var
  3783. tmpreg,overflowreg : tregister;
  3784. asmop : tasmop;
  3785. begin
  3786. case op of
  3787. OP_NEG:
  3788. list.concat(taicpu.op_reg_reg(A_NEG,dst,src));
  3789. OP_NOT:
  3790. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  3791. OP_DIV,OP_IDIV:
  3792. internalerror(200308284);
  3793. OP_ROL:
  3794. begin
  3795. if not(size in [OS_32,OS_S32]) then
  3796. internalerror(2008072801);
  3797. { simulate ROL by ror'ing 32-value }
  3798. tmpreg:=getintregister(list,OS_32);
  3799. a_load_const_reg(list,OS_32,32,tmpreg);
  3800. list.concat(taicpu.op_reg_reg(A_SUB,tmpreg,src));
  3801. list.concat(taicpu.op_reg_reg(A_ROR,dst,src));
  3802. end;
  3803. else
  3804. begin
  3805. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3806. list.concat(setoppostfix(
  3807. taicpu.op_reg_reg(op_reg_opcg2asmop[op],dst,src),op_reg_postfix[op]));
  3808. end;
  3809. end;
  3810. maybeadjustresult(list,op,size,dst);
  3811. end;
  3812. procedure tthumbcgarm.a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);
  3813. var
  3814. tmpreg : tregister;
  3815. so : tshifterop;
  3816. l1 : longint;
  3817. imm1, imm2: DWord;
  3818. begin
  3819. //!!! ovloc.loc:=LOC_VOID;
  3820. if {$ifopt R+}(a<>-2147483648) and{$endif} {!!!!!! not setflags and } is_thumb_imm(-a) then
  3821. case op of
  3822. OP_ADD:
  3823. begin
  3824. op:=OP_SUB;
  3825. a:=aint(dword(-a));
  3826. end;
  3827. OP_SUB:
  3828. begin
  3829. op:=OP_ADD;
  3830. a:=aint(dword(-a));
  3831. end
  3832. end;
  3833. if is_thumb_imm(a) and (op in [OP_ADD,OP_SUB]) then
  3834. begin
  3835. // if cgsetflags or setflags then
  3836. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3837. list.concat(setoppostfix(
  3838. taicpu.op_reg_const(op_reg_opcg2asmop[op],dst,a),op_reg_postfix[op]));
  3839. if (cgsetflags {!!! or setflags }) and (size in [OS_8,OS_16,OS_32]) then
  3840. begin
  3841. //!!! ovloc.loc:=LOC_FLAGS;
  3842. case op of
  3843. OP_ADD:
  3844. //!!! ovloc.resflags:=F_CS;
  3845. ;
  3846. OP_SUB:
  3847. //!!! ovloc.resflags:=F_CC;
  3848. ;
  3849. end;
  3850. end;
  3851. end
  3852. else
  3853. begin
  3854. { there could be added some more sophisticated optimizations }
  3855. if (op in [OP_MUL,OP_IMUL,OP_DIV,OP_IDIV]) and (a=1) then
  3856. a_load_reg_reg(list,size,size,dst,dst)
  3857. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  3858. a_load_const_reg(list,size,0,dst)
  3859. else if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  3860. a_op_reg_reg(list,OP_NEG,size,dst,dst)
  3861. { we do this here instead in the peephole optimizer because
  3862. it saves us a register }
  3863. {$ifdef DUMMY}
  3864. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  3865. a_op_const_reg_reg(list,OP_SHL,size,l1,dst,dst)
  3866. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  3867. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  3868. begin
  3869. if l1>32 then{roozbeh does this ever happen?}
  3870. internalerror(200308296);
  3871. shifterop_reset(so);
  3872. so.shiftmode:=SM_LSL;
  3873. so.shiftimm:=l1;
  3874. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,dst,so));
  3875. end
  3876. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  3877. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  3878. begin
  3879. if l1>32 then{does this ever happen?}
  3880. internalerror(201205181);
  3881. shifterop_reset(so);
  3882. so.shiftmode:=SM_LSL;
  3883. so.shiftimm:=l1;
  3884. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,dst,dst,so));
  3885. end
  3886. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,dst,dst) then
  3887. begin
  3888. { nothing to do on success }
  3889. end
  3890. {$endif DUMMY}
  3891. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  3892. Just using mov x, #0 might allow some easier optimizations down the line. }
  3893. else if (op = OP_AND) and (dword(a)=0) then
  3894. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  3895. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  3896. else if (op = OP_AND) and (not(dword(a))=0) then
  3897. // do nothing
  3898. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  3899. broader range of shifterconstants.}
  3900. {$ifdef DUMMY}
  3901. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  3902. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,not(dword(a))))
  3903. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  3904. begin
  3905. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm1));
  3906. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  3907. end
  3908. else if (op in [OP_ADD, OP_SUB, OP_OR]) and
  3909. not(cgsetflags or setflags) and
  3910. split_into_shifter_const(a, imm1, imm2) then
  3911. begin
  3912. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm1));
  3913. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  3914. end
  3915. {$endif DUMMY}
  3916. else if (op in [OP_SHL, OP_SHR, OP_SAR]) then
  3917. begin
  3918. list.concat(taicpu.op_reg_reg_const(op_reg_opcg2asmop[op],dst,dst,a));
  3919. end
  3920. else
  3921. begin
  3922. tmpreg:=getintregister(list,size);
  3923. a_load_const_reg(list,size,a,tmpreg);
  3924. a_op_reg_reg(list,op,size,tmpreg,dst);
  3925. end;
  3926. end;
  3927. maybeadjustresult(list,op,size,dst);
  3928. end;
  3929. procedure tthumbcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister);
  3930. begin
  3931. if (op=OP_ADD) and (src=NR_R13) and (dst<>NR_R13) and ((a mod 4)=0) and (a>0) and (a<=1020) then
  3932. list.concat(taicpu.op_reg_reg_const(A_ADD,dst,src,a))
  3933. else
  3934. inherited a_op_const_reg_reg(list,op,size,a,src,dst);
  3935. end;
  3936. procedure tthumbcgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  3937. var
  3938. l1,l2 : tasmlabel;
  3939. ai : taicpu;
  3940. begin
  3941. current_asmdata.getjumplabel(l1);
  3942. current_asmdata.getjumplabel(l2);
  3943. ai:=setcondition(taicpu.op_sym(A_B,l1),flags_to_cond(f));
  3944. ai.is_jmp:=true;
  3945. list.concat(ai);
  3946. list.concat(taicpu.op_reg_const(A_MOV,reg,0));
  3947. list.concat(taicpu.op_sym(A_B,l2));
  3948. cg.a_label(list,l1);
  3949. list.concat(taicpu.op_reg_const(A_MOV,reg,1));
  3950. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3951. cg.a_label(list,l2);
  3952. end;
  3953. procedure tthumbcgarm.g_external_wrapper(list: TAsmList; procdef: tprocdef; const externalname: string);
  3954. var
  3955. tmpref : treference;
  3956. l : tasmlabel;
  3957. begin
  3958. { there is no branch instruction on thumb which allows big distances and which leaves LR as it is
  3959. and which allows to switch the instruction set }
  3960. { create const entry }
  3961. reference_reset(tmpref,4);
  3962. current_asmdata.getjumplabel(l);
  3963. tmpref.symbol:=l;
  3964. tmpref.base:=NR_PC;
  3965. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R0]));
  3966. list.concat(taicpu.op_reg_ref(A_LDR,NR_R0,tmpref));
  3967. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_R0));
  3968. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R0]));
  3969. list.concat(taicpu.op_reg(A_BX,NR_R12));
  3970. { append const entry }
  3971. list.Concat(tai_align.Create(4));
  3972. list.Concat(tai_label.create(l));
  3973. list.concat(tai_const.Create_sym(current_asmdata.RefAsmSymbol(externalname)));
  3974. end;
  3975. procedure tthumb2cgarm.init_register_allocators;
  3976. begin
  3977. inherited init_register_allocators;
  3978. { currently, we save R14 always, so we can use it }
  3979. if (target_info.system<>system_arm_darwin) then
  3980. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3981. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3982. RS_R9,RS_R10,RS_R12,RS_R14],first_int_imreg,[])
  3983. else
  3984. { r9 is not available on Darwin according to the llvm code generator }
  3985. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3986. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3987. RS_R10,RS_R12,RS_R14],first_int_imreg,[]);
  3988. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  3989. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  3990. if current_settings.fputype=fpu_vfpv3 then
  3991. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3992. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3993. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  3994. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3995. ],first_mm_imreg,[])
  3996. else if current_settings.fputype in [fpu_fpv4_s16,fpu_vfpv3_d16] then
  3997. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3998. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3999. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  4000. ],first_mm_imreg,[])
  4001. else
  4002. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBNONE,
  4003. [RS_S0,RS_S1,RS_R2,RS_R3,RS_R4,RS_S31],first_mm_imreg,[]);
  4004. end;
  4005. procedure tthumb2cgarm.done_register_allocators;
  4006. begin
  4007. rg[R_INTREGISTER].free;
  4008. rg[R_FPUREGISTER].free;
  4009. rg[R_MMREGISTER].free;
  4010. inherited done_register_allocators;
  4011. end;
  4012. procedure tthumb2cgarm.a_call_reg(list : TAsmList;reg: tregister);
  4013. begin
  4014. list.concat(taicpu.op_reg(A_BLX, reg));
  4015. {
  4016. the compiler does not properly set this flag anymore in pass 1, and
  4017. for now we only need it after pass 2 (I hope) (JM)
  4018. if not(pi_do_call in current_procinfo.flags) then
  4019. internalerror(2003060703);
  4020. }
  4021. include(current_procinfo.flags,pi_do_call);
  4022. end;
  4023. procedure tthumb2cgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  4024. var
  4025. imm_shift : byte;
  4026. l : tasmlabel;
  4027. hr : treference;
  4028. begin
  4029. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  4030. internalerror(2002090902);
  4031. if is_thumb32_imm(a) then
  4032. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  4033. else if is_thumb32_imm(not(a)) then
  4034. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  4035. else if (a and $FFFF)=a then
  4036. list.concat(taicpu.op_reg_const(A_MOVW,reg,a))
  4037. else
  4038. begin
  4039. reference_reset(hr,4);
  4040. current_asmdata.getjumplabel(l);
  4041. cg.a_label(current_procinfo.aktlocaldata,l);
  4042. hr.symboldata:=current_procinfo.aktlocaldata.last;
  4043. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  4044. hr.symbol:=l;
  4045. hr.base:=NR_PC;
  4046. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  4047. end;
  4048. end;
  4049. procedure tthumb2cgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  4050. var
  4051. oppostfix:toppostfix;
  4052. usedtmpref: treference;
  4053. tmpreg,tmpreg2 : tregister;
  4054. so : tshifterop;
  4055. dir : integer;
  4056. begin
  4057. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  4058. FromSize := ToSize;
  4059. case FromSize of
  4060. { signed integer registers }
  4061. OS_8:
  4062. oppostfix:=PF_B;
  4063. OS_S8:
  4064. oppostfix:=PF_SB;
  4065. OS_16:
  4066. oppostfix:=PF_H;
  4067. OS_S16:
  4068. oppostfix:=PF_SH;
  4069. OS_32,
  4070. OS_S32:
  4071. oppostfix:=PF_None;
  4072. else
  4073. InternalError(200308299);
  4074. end;
  4075. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  4076. begin
  4077. if target_info.endian=endian_big then
  4078. dir:=-1
  4079. else
  4080. dir:=1;
  4081. case FromSize of
  4082. OS_16,OS_S16:
  4083. begin
  4084. { only complicated references need an extra loadaddr }
  4085. if assigned(ref.symbol) or
  4086. (ref.index<>NR_NO) or
  4087. (ref.offset<-255) or
  4088. (ref.offset>4094) or
  4089. { sometimes the compiler reused registers }
  4090. (reg=ref.index) or
  4091. (reg=ref.base) then
  4092. begin
  4093. tmpreg2:=getintregister(list,OS_INT);
  4094. a_loadaddr_ref_reg(list,ref,tmpreg2);
  4095. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  4096. end
  4097. else
  4098. usedtmpref:=ref;
  4099. if target_info.endian=endian_big then
  4100. inc(usedtmpref.offset,1);
  4101. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  4102. tmpreg:=getintregister(list,OS_INT);
  4103. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  4104. inc(usedtmpref.offset,dir);
  4105. if FromSize=OS_16 then
  4106. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  4107. else
  4108. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  4109. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4110. end;
  4111. OS_32,OS_S32:
  4112. begin
  4113. tmpreg:=getintregister(list,OS_INT);
  4114. { only complicated references need an extra loadaddr }
  4115. if assigned(ref.symbol) or
  4116. (ref.index<>NR_NO) or
  4117. (ref.offset<-255) or
  4118. (ref.offset>4092) or
  4119. { sometimes the compiler reused registers }
  4120. (reg=ref.index) or
  4121. (reg=ref.base) then
  4122. begin
  4123. tmpreg2:=getintregister(list,OS_INT);
  4124. a_loadaddr_ref_reg(list,ref,tmpreg2);
  4125. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  4126. end
  4127. else
  4128. usedtmpref:=ref;
  4129. shifterop_reset(so);so.shiftmode:=SM_LSL;
  4130. if ref.alignment=2 then
  4131. begin
  4132. if target_info.endian=endian_big then
  4133. inc(usedtmpref.offset,2);
  4134. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  4135. inc(usedtmpref.offset,dir*2);
  4136. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  4137. so.shiftimm:=16;
  4138. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4139. end
  4140. else
  4141. begin
  4142. if target_info.endian=endian_big then
  4143. inc(usedtmpref.offset,3);
  4144. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  4145. inc(usedtmpref.offset,dir);
  4146. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4147. so.shiftimm:=8;
  4148. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4149. inc(usedtmpref.offset,dir);
  4150. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4151. so.shiftimm:=16;
  4152. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4153. inc(usedtmpref.offset,dir);
  4154. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4155. so.shiftimm:=24;
  4156. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4157. end;
  4158. end
  4159. else
  4160. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4161. end;
  4162. end
  4163. else
  4164. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4165. if (fromsize=OS_S8) and (tosize = OS_16) then
  4166. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  4167. end;
  4168. procedure tthumb2cgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  4169. begin
  4170. if op = OP_NOT then
  4171. begin
  4172. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  4173. case size of
  4174. OS_8: list.concat(taicpu.op_reg_reg(A_UXTB,dst,dst));
  4175. OS_S8: list.concat(taicpu.op_reg_reg(A_SXTB,dst,dst));
  4176. OS_16: list.concat(taicpu.op_reg_reg(A_UXTH,dst,dst));
  4177. OS_S16: list.concat(taicpu.op_reg_reg(A_SXTH,dst,dst));
  4178. end;
  4179. end
  4180. else
  4181. inherited a_op_reg_reg(list, op, size, src, dst);
  4182. end;
  4183. procedure tthumb2cgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4184. var
  4185. shift, width : byte;
  4186. tmpreg : tregister;
  4187. so : tshifterop;
  4188. l1 : longint;
  4189. begin
  4190. ovloc.loc:=LOC_VOID;
  4191. if {$ifopt R+}(a<>-2147483648) and{$endif} is_shifter_const(-a,shift) then
  4192. case op of
  4193. OP_ADD:
  4194. begin
  4195. op:=OP_SUB;
  4196. a:=aint(dword(-a));
  4197. end;
  4198. OP_SUB:
  4199. begin
  4200. op:=OP_ADD;
  4201. a:=aint(dword(-a));
  4202. end
  4203. end;
  4204. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  4205. case op of
  4206. OP_NEG,OP_NOT,
  4207. OP_DIV,OP_IDIV:
  4208. internalerror(200308285);
  4209. OP_SHL:
  4210. begin
  4211. if a>32 then
  4212. internalerror(2014020703);
  4213. if a<>0 then
  4214. begin
  4215. shifterop_reset(so);
  4216. so.shiftmode:=SM_LSL;
  4217. so.shiftimm:=a;
  4218. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4219. end
  4220. else
  4221. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4222. end;
  4223. OP_ROL:
  4224. begin
  4225. if a>32 then
  4226. internalerror(2014020704);
  4227. if a<>0 then
  4228. begin
  4229. shifterop_reset(so);
  4230. so.shiftmode:=SM_ROR;
  4231. so.shiftimm:=32-a;
  4232. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4233. end
  4234. else
  4235. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4236. end;
  4237. OP_ROR:
  4238. begin
  4239. if a>32 then
  4240. internalerror(2014020705);
  4241. if a<>0 then
  4242. begin
  4243. shifterop_reset(so);
  4244. so.shiftmode:=SM_ROR;
  4245. so.shiftimm:=a;
  4246. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4247. end
  4248. else
  4249. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4250. end;
  4251. OP_SHR:
  4252. begin
  4253. if a>32 then
  4254. internalerror(200308292);
  4255. shifterop_reset(so);
  4256. if a<>0 then
  4257. begin
  4258. so.shiftmode:=SM_LSR;
  4259. so.shiftimm:=a;
  4260. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4261. end
  4262. else
  4263. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4264. end;
  4265. OP_SAR:
  4266. begin
  4267. if a>32 then
  4268. internalerror(200308295);
  4269. if a<>0 then
  4270. begin
  4271. shifterop_reset(so);
  4272. so.shiftmode:=SM_ASR;
  4273. so.shiftimm:=a;
  4274. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4275. end
  4276. else
  4277. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4278. end;
  4279. else
  4280. if (op in [OP_SUB, OP_ADD]) and
  4281. ((a < 0) or
  4282. (a > 4095)) then
  4283. begin
  4284. tmpreg:=getintregister(list,size);
  4285. a_load_const_reg(list, size, a, tmpreg);
  4286. if cgsetflags or setflags then
  4287. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4288. list.concat(setoppostfix(
  4289. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4290. end
  4291. else
  4292. begin
  4293. if cgsetflags or setflags then
  4294. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4295. list.concat(setoppostfix(
  4296. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4297. end;
  4298. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  4299. begin
  4300. ovloc.loc:=LOC_FLAGS;
  4301. case op of
  4302. OP_ADD:
  4303. ovloc.resflags:=F_CS;
  4304. OP_SUB:
  4305. ovloc.resflags:=F_CC;
  4306. end;
  4307. end;
  4308. end
  4309. else
  4310. begin
  4311. { there could be added some more sophisticated optimizations }
  4312. if (op in [OP_MUL,OP_IMUL]) and (a=1) then
  4313. a_load_reg_reg(list,size,size,src,dst)
  4314. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  4315. a_load_const_reg(list,size,0,dst)
  4316. else if (op in [OP_IMUL]) and (a=-1) then
  4317. a_op_reg_reg(list,OP_NEG,size,src,dst)
  4318. { we do this here instead in the peephole optimizer because
  4319. it saves us a register }
  4320. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  4321. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  4322. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  4323. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  4324. begin
  4325. if l1>32 then{roozbeh does this ever happen?}
  4326. internalerror(200308296);
  4327. shifterop_reset(so);
  4328. so.shiftmode:=SM_LSL;
  4329. so.shiftimm:=l1;
  4330. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  4331. end
  4332. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  4333. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  4334. begin
  4335. if l1>32 then{does this ever happen?}
  4336. internalerror(201205181);
  4337. shifterop_reset(so);
  4338. so.shiftmode:=SM_LSL;
  4339. so.shiftimm:=l1;
  4340. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  4341. end
  4342. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  4343. begin
  4344. { nothing to do on success }
  4345. end
  4346. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  4347. Just using mov x, #0 might allow some easier optimizations down the line. }
  4348. else if (op = OP_AND) and (dword(a)=0) then
  4349. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  4350. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  4351. else if (op = OP_AND) and (not(dword(a))=0) then
  4352. list.concat(taicpu.op_reg_reg(A_MOV,dst,src))
  4353. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  4354. broader range of shifterconstants.}
  4355. {else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  4356. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))}
  4357. else if (op = OP_AND) and is_thumb32_imm(a) then
  4358. list.concat(taicpu.op_reg_reg_const(A_AND,dst,src,dword(a)))
  4359. else if (op = OP_AND) and (a = $FFFF) then
  4360. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  4361. else if (op = OP_AND) and is_thumb32_imm(not(dword(a))) then
  4362. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  4363. else if (op = OP_AND) and is_continuous_mask(not(a), shift, width) then
  4364. begin
  4365. a_load_reg_reg(list,size,size,src,dst);
  4366. list.concat(taicpu.op_reg_const_const(A_BFC,dst,shift,width))
  4367. end
  4368. else
  4369. begin
  4370. tmpreg:=getintregister(list,size);
  4371. a_load_const_reg(list,size,a,tmpreg);
  4372. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  4373. end;
  4374. end;
  4375. maybeadjustresult(list,op,size,dst);
  4376. end;
  4377. const
  4378. op_reg_reg_opcg2asmopThumb2: array[TOpCG] of tasmop =
  4379. (A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NONE,A_MVN,A_ORR,
  4380. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  4381. procedure tthumb2cgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4382. var
  4383. so : tshifterop;
  4384. tmpreg,overflowreg : tregister;
  4385. asmop : tasmop;
  4386. begin
  4387. ovloc.loc:=LOC_VOID;
  4388. case op of
  4389. OP_NEG,OP_NOT:
  4390. internalerror(200308286);
  4391. OP_ROL:
  4392. begin
  4393. if not(size in [OS_32,OS_S32]) then
  4394. internalerror(2008072801);
  4395. { simulate ROL by ror'ing 32-value }
  4396. tmpreg:=getintregister(list,OS_32);
  4397. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,32));
  4398. list.concat(taicpu.op_reg_reg_reg(A_SUB,src1,tmpreg,src1));
  4399. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4400. end;
  4401. OP_ROR:
  4402. begin
  4403. if not(size in [OS_32,OS_S32]) then
  4404. internalerror(2008072802);
  4405. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4406. end;
  4407. OP_IMUL,
  4408. OP_MUL:
  4409. begin
  4410. if cgsetflags or setflags then
  4411. begin
  4412. overflowreg:=getintregister(list,size);
  4413. if op=OP_IMUL then
  4414. asmop:=A_SMULL
  4415. else
  4416. asmop:=A_UMULL;
  4417. { the arm doesn't allow that rd and rm are the same }
  4418. if dst=src2 then
  4419. begin
  4420. if dst<>src1 then
  4421. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  4422. else
  4423. begin
  4424. tmpreg:=getintregister(list,size);
  4425. a_load_reg_reg(list,size,size,src2,dst);
  4426. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  4427. end;
  4428. end
  4429. else
  4430. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  4431. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4432. if op=OP_IMUL then
  4433. begin
  4434. shifterop_reset(so);
  4435. so.shiftmode:=SM_ASR;
  4436. so.shiftimm:=31;
  4437. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  4438. end
  4439. else
  4440. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  4441. ovloc.loc:=LOC_FLAGS;
  4442. ovloc.resflags:=F_NE;
  4443. end
  4444. else
  4445. begin
  4446. { the arm doesn't allow that rd and rm are the same }
  4447. if dst=src2 then
  4448. begin
  4449. if dst<>src1 then
  4450. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  4451. else
  4452. begin
  4453. tmpreg:=getintregister(list,size);
  4454. a_load_reg_reg(list,size,size,src2,dst);
  4455. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  4456. end;
  4457. end
  4458. else
  4459. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  4460. end;
  4461. end;
  4462. else
  4463. begin
  4464. if cgsetflags or setflags then
  4465. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4466. {$ifdef dummy}
  4467. { R13 is not allowed for certain instruction operands }
  4468. if op_reg_reg_opcg2asmopThumb2[op] in [A_ADD,A_SUB,A_AND,A_BIC,A_EOR] then
  4469. begin
  4470. if getsupreg(dst)=RS_R13 then
  4471. begin
  4472. tmpreg:=getintregister(list,OS_INT);
  4473. a_load_reg_reg(list,OS_INT,OS_INT,dst,tmpreg);
  4474. dst:=tmpreg;
  4475. end;
  4476. if getsupreg(src1)=RS_R13 then
  4477. begin
  4478. tmpreg:=getintregister(list,OS_INT);
  4479. a_load_reg_reg(list,OS_INT,OS_INT,src1,tmpreg);
  4480. src1:=tmpreg;
  4481. end;
  4482. end;
  4483. {$endif}
  4484. list.concat(setoppostfix(
  4485. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmopThumb2[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4486. end;
  4487. end;
  4488. maybeadjustresult(list,op,size,dst);
  4489. end;
  4490. procedure tthumb2cgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  4491. var item: taicpu;
  4492. begin
  4493. list.concat(taicpu.op_cond(A_ITE, flags_to_cond(f)));
  4494. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  4495. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  4496. end;
  4497. procedure tthumb2cgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  4498. var
  4499. ref : treference;
  4500. shift : byte;
  4501. firstfloatreg,lastfloatreg,
  4502. r : byte;
  4503. regs : tcpuregisterset;
  4504. stackmisalignment: pint;
  4505. begin
  4506. LocalSize:=align(LocalSize,4);
  4507. { call instruction does not put anything on the stack }
  4508. stackmisalignment:=0;
  4509. if not(nostackframe) then
  4510. begin
  4511. firstfloatreg:=RS_NO;
  4512. lastfloatreg:=RS_NO;
  4513. { save floating point registers? }
  4514. for r:=RS_F0 to RS_F7 do
  4515. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4516. begin
  4517. if firstfloatreg=RS_NO then
  4518. firstfloatreg:=r;
  4519. lastfloatreg:=r;
  4520. inc(stackmisalignment,12);
  4521. end;
  4522. a_reg_alloc(list,NR_STACK_POINTER_REG);
  4523. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4524. begin
  4525. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  4526. a_reg_alloc(list,NR_R12);
  4527. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  4528. end;
  4529. { save int registers }
  4530. reference_reset(ref,4);
  4531. ref.index:=NR_STACK_POINTER_REG;
  4532. ref.addressmode:=AM_PREINDEXED;
  4533. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4534. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4535. regs:=regs+[RS_FRAME_POINTER_REG,RS_R14]
  4536. else if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  4537. include(regs,RS_R14);
  4538. if regs<>[] then
  4539. begin
  4540. for r:=RS_R0 to RS_R15 do
  4541. if (r in regs) then
  4542. inc(stackmisalignment,4);
  4543. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4544. end;
  4545. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4546. begin
  4547. { the framepointer now points to the saved R15, so the saved
  4548. framepointer is at R11-12 (for get_caller_frame) }
  4549. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  4550. a_reg_dealloc(list,NR_R12);
  4551. end;
  4552. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4553. if (LocalSize<>0) or
  4554. ((stackmisalignment<>0) and
  4555. ((pi_do_call in current_procinfo.flags) or
  4556. (po_assembler in current_procinfo.procdef.procoptions))) then
  4557. begin
  4558. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4559. if not(is_shifter_const(localsize,shift)) then
  4560. begin
  4561. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  4562. a_reg_alloc(list,NR_R12);
  4563. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4564. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  4565. a_reg_dealloc(list,NR_R12);
  4566. end
  4567. else
  4568. begin
  4569. a_reg_dealloc(list,NR_R12);
  4570. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  4571. end;
  4572. end;
  4573. if firstfloatreg<>RS_NO then
  4574. begin
  4575. reference_reset(ref,4);
  4576. if tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023 then
  4577. begin
  4578. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  4579. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4580. ref.base:=NR_R12;
  4581. end
  4582. else
  4583. begin
  4584. ref.base:=current_procinfo.framepointer;
  4585. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  4586. end;
  4587. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4588. lastfloatreg-firstfloatreg+1,ref));
  4589. end;
  4590. end;
  4591. end;
  4592. procedure tthumb2cgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  4593. var
  4594. ref : treference;
  4595. firstfloatreg,lastfloatreg,
  4596. r : byte;
  4597. shift : byte;
  4598. regs : tcpuregisterset;
  4599. LocalSize : longint;
  4600. stackmisalignment: pint;
  4601. begin
  4602. if not(nostackframe) then
  4603. begin
  4604. stackmisalignment:=0;
  4605. { restore floating point register }
  4606. firstfloatreg:=RS_NO;
  4607. lastfloatreg:=RS_NO;
  4608. { save floating point registers? }
  4609. for r:=RS_F0 to RS_F7 do
  4610. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4611. begin
  4612. if firstfloatreg=RS_NO then
  4613. firstfloatreg:=r;
  4614. lastfloatreg:=r;
  4615. { floating point register space is already included in
  4616. localsize below by calc_stackframe_size
  4617. inc(stackmisalignment,12);
  4618. }
  4619. end;
  4620. if firstfloatreg<>RS_NO then
  4621. begin
  4622. reference_reset(ref,4);
  4623. if tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023 then
  4624. begin
  4625. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  4626. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4627. ref.base:=NR_R12;
  4628. end
  4629. else
  4630. begin
  4631. ref.base:=current_procinfo.framepointer;
  4632. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  4633. end;
  4634. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4635. lastfloatreg-firstfloatreg+1,ref));
  4636. end;
  4637. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4638. if (pi_do_call in current_procinfo.flags) or (regs<>[]) then
  4639. begin
  4640. exclude(regs,RS_R14);
  4641. include(regs,RS_R15);
  4642. end;
  4643. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  4644. regs:=regs+[RS_FRAME_POINTER_REG,RS_R15];
  4645. for r:=RS_R0 to RS_R15 do
  4646. if (r in regs) then
  4647. inc(stackmisalignment,4);
  4648. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4649. LocalSize:=current_procinfo.calc_stackframe_size;
  4650. if (LocalSize<>0) or
  4651. ((stackmisalignment<>0) and
  4652. ((pi_do_call in current_procinfo.flags) or
  4653. (po_assembler in current_procinfo.procdef.procoptions))) then
  4654. begin
  4655. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4656. if not(is_shifter_const(LocalSize,shift)) then
  4657. begin
  4658. a_reg_alloc(list,NR_R12);
  4659. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4660. list.concat(taicpu.op_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_R12));
  4661. a_reg_dealloc(list,NR_R12);
  4662. end
  4663. else
  4664. begin
  4665. a_reg_dealloc(list,NR_R12);
  4666. list.concat(taicpu.op_reg_const(A_ADD,NR_STACK_POINTER_REG,LocalSize));
  4667. end;
  4668. end;
  4669. if regs=[] then
  4670. list.concat(taicpu.op_reg_reg(A_MOV,NR_R15,NR_R14))
  4671. else
  4672. begin
  4673. reference_reset(ref,4);
  4674. ref.index:=NR_STACK_POINTER_REG;
  4675. ref.addressmode:=AM_PREINDEXED;
  4676. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4677. end;
  4678. end
  4679. else
  4680. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14));
  4681. end;
  4682. function tthumb2cgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  4683. var
  4684. tmpreg : tregister;
  4685. tmpref : treference;
  4686. l : tasmlabel;
  4687. so: tshifterop;
  4688. begin
  4689. tmpreg:=NR_NO;
  4690. { Be sure to have a base register }
  4691. if (ref.base=NR_NO) then
  4692. begin
  4693. if ref.shiftmode<>SM_None then
  4694. internalerror(2014020706);
  4695. ref.base:=ref.index;
  4696. ref.index:=NR_NO;
  4697. end;
  4698. { absolute symbols can't be handled directly, we've to store the symbol reference
  4699. in the text segment and access it pc relative
  4700. For now, we assume that references where base or index equals to PC are already
  4701. relative, all other references are assumed to be absolute and thus they need
  4702. to be handled extra.
  4703. A proper solution would be to change refoptions to a set and store the information
  4704. if the symbol is absolute or relative there.
  4705. }
  4706. if (assigned(ref.symbol) and
  4707. not(is_pc(ref.base)) and
  4708. not(is_pc(ref.index))
  4709. ) or
  4710. { [#xxx] isn't a valid address operand }
  4711. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  4712. //(ref.offset<-4095) or
  4713. (ref.offset<-255) or
  4714. (ref.offset>4095) or
  4715. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  4716. ((ref.offset<-255) or
  4717. (ref.offset>255)
  4718. )
  4719. ) or
  4720. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  4721. ((ref.offset<-1020) or
  4722. (ref.offset>1020) or
  4723. ((abs(ref.offset) mod 4)<>0) or
  4724. { the usual pc relative symbol handling assumes possible offsets of +/- 4095 }
  4725. assigned(ref.symbol)
  4726. )
  4727. ) then
  4728. begin
  4729. reference_reset(tmpref,4);
  4730. { load symbol }
  4731. tmpreg:=getintregister(list,OS_INT);
  4732. if assigned(ref.symbol) then
  4733. begin
  4734. current_asmdata.getjumplabel(l);
  4735. cg.a_label(current_procinfo.aktlocaldata,l);
  4736. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  4737. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset));
  4738. { load consts entry }
  4739. tmpref.symbol:=l;
  4740. tmpref.base:=NR_R15;
  4741. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  4742. { in case of LDF/STF, we got rid of the NR_R15 }
  4743. if is_pc(ref.base) then
  4744. ref.base:=NR_NO;
  4745. if is_pc(ref.index) then
  4746. ref.index:=NR_NO;
  4747. end
  4748. else
  4749. a_load_const_reg(list,OS_ADDR,ref.offset,tmpreg);
  4750. if (ref.base<>NR_NO) then
  4751. begin
  4752. if ref.index<>NR_NO then
  4753. begin
  4754. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4755. ref.base:=tmpreg;
  4756. end
  4757. else
  4758. begin
  4759. ref.index:=tmpreg;
  4760. ref.shiftimm:=0;
  4761. ref.signindex:=1;
  4762. ref.shiftmode:=SM_None;
  4763. end;
  4764. end
  4765. else
  4766. ref.base:=tmpreg;
  4767. ref.offset:=0;
  4768. ref.symbol:=nil;
  4769. end;
  4770. if (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  4771. begin
  4772. if tmpreg<>NR_NO then
  4773. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg,tmpreg)
  4774. else
  4775. begin
  4776. tmpreg:=getintregister(list,OS_ADDR);
  4777. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg);
  4778. ref.base:=tmpreg;
  4779. end;
  4780. ref.offset:=0;
  4781. end;
  4782. { Hack? Thumb2 doesn't allow PC indexed addressing modes(although it does in the specification) }
  4783. if (ref.base=NR_R15) and (ref.index<>NR_NO) and (ref.shiftmode <> sm_none) then
  4784. begin
  4785. tmpreg:=getintregister(list,OS_ADDR);
  4786. list.concat(taicpu.op_reg_reg(A_MOV, tmpreg, NR_R15));
  4787. ref.base := tmpreg;
  4788. end;
  4789. { floating point operations have only limited references
  4790. we expect here, that a base is already set }
  4791. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  4792. begin
  4793. if ref.shiftmode<>SM_none then
  4794. internalerror(200309121);
  4795. if tmpreg<>NR_NO then
  4796. begin
  4797. if ref.base=tmpreg then
  4798. begin
  4799. if ref.signindex<0 then
  4800. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,tmpreg,ref.index))
  4801. else
  4802. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,tmpreg,ref.index));
  4803. ref.index:=NR_NO;
  4804. end
  4805. else
  4806. begin
  4807. if ref.index<>tmpreg then
  4808. internalerror(200403161);
  4809. if ref.signindex<0 then
  4810. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,ref.base,tmpreg))
  4811. else
  4812. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4813. ref.base:=tmpreg;
  4814. ref.index:=NR_NO;
  4815. end;
  4816. end
  4817. else
  4818. begin
  4819. tmpreg:=getintregister(list,OS_ADDR);
  4820. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,ref.index));
  4821. ref.base:=tmpreg;
  4822. ref.index:=NR_NO;
  4823. end;
  4824. end;
  4825. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  4826. Result := ref;
  4827. end;
  4828. procedure tthumb2cgarm.a_loadmm_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister; shuffle: pmmshuffle);
  4829. var
  4830. instr: taicpu;
  4831. begin
  4832. if (fromsize=OS_F32) and
  4833. (tosize=OS_F32) then
  4834. begin
  4835. instr:=setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32);
  4836. list.Concat(instr);
  4837. add_move_instruction(instr);
  4838. end
  4839. else if (fromsize=OS_F64) and
  4840. (tosize=OS_F64) then
  4841. begin
  4842. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,tregister(longint(reg2)+1),tregister(longint(reg1)+1)), PF_F32));
  4843. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32));
  4844. end
  4845. else if (fromsize=OS_F32) and
  4846. (tosize=OS_F64) then
  4847. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VCVT,reg2,reg1), PF_F32))
  4848. begin
  4849. //list.concat(nil);
  4850. end;
  4851. end;
  4852. procedure tthumb2cgarm.a_loadmm_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  4853. begin
  4854. handle_load_store(list,A_VLDR,PF_None,reg,ref);
  4855. end;
  4856. procedure tthumb2cgarm.a_loadmm_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  4857. begin
  4858. handle_load_store(list,A_VSTR,PF_None,reg,ref);
  4859. end;
  4860. procedure tthumb2cgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize: tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  4861. begin
  4862. if //(shuffle=nil) and
  4863. (tosize=OS_F32) then
  4864. list.Concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg))
  4865. else
  4866. internalerror(2012100813);
  4867. end;
  4868. procedure tthumb2cgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize: tcgsize; mmreg, intreg: tregister; shuffle: pmmshuffle);
  4869. begin
  4870. if //(shuffle=nil) and
  4871. (fromsize=OS_F32) then
  4872. list.Concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg))
  4873. else
  4874. internalerror(2012100814);
  4875. end;
  4876. procedure tthumb2cg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  4877. var tmpreg: tregister;
  4878. begin
  4879. case op of
  4880. OP_NEG:
  4881. begin
  4882. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4883. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  4884. tmpreg:=cg.getintregister(list,OS_32);
  4885. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,0));
  4886. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,tmpreg,regsrc.reghi));
  4887. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4888. end;
  4889. else
  4890. inherited a_op64_reg_reg(list, op, size, regsrc, regdst);
  4891. end;
  4892. end;
  4893. procedure tthumbcg64farm.a_op64_reg_reg(list: TAsmList; op: TOpCG; size: tcgsize; regsrc, regdst: tregister64);
  4894. begin
  4895. case op of
  4896. OP_NEG:
  4897. begin
  4898. list.concat(taicpu.op_reg_const(A_MOV,regdst.reglo,0));
  4899. list.concat(taicpu.op_reg_const(A_MOV,regdst.reghi,0));
  4900. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4901. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4902. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4903. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4904. end;
  4905. OP_NOT:
  4906. begin
  4907. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  4908. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  4909. end;
  4910. OP_AND,OP_OR,OP_XOR:
  4911. begin
  4912. cg.a_op_reg_reg(list,op,OS_32,regsrc.reglo,regdst.reglo);
  4913. cg.a_op_reg_reg(list,op,OS_32,regsrc.reghi,regdst.reghi);
  4914. end;
  4915. OP_ADD:
  4916. begin
  4917. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4918. list.concat(taicpu.op_reg_reg(A_ADD,regdst.reglo,regsrc.reglo));
  4919. list.concat(taicpu.op_reg_reg(A_ADC,regdst.reghi,regsrc.reghi));
  4920. end;
  4921. OP_SUB:
  4922. begin
  4923. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4924. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4925. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4926. end;
  4927. else
  4928. internalerror(2003083101);
  4929. end;
  4930. end;
  4931. procedure tthumbcg64farm.a_op64_const_reg(list: TAsmList; op: TOpCG; size: tcgsize; value: int64; reg: tregister64);
  4932. var
  4933. tmpreg : tregister;
  4934. b : byte;
  4935. begin
  4936. case op of
  4937. OP_AND,OP_OR,OP_XOR:
  4938. begin
  4939. cg.a_op_const_reg(list,op,OS_32,aint(lo(value)),reg.reglo);
  4940. cg.a_op_const_reg(list,op,OS_32,aint(hi(value)),reg.reghi);
  4941. end;
  4942. OP_ADD:
  4943. begin
  4944. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4945. begin
  4946. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4947. list.concat(taicpu.op_reg_const(A_ADD,reg.reglo,aint(lo(value))));
  4948. end
  4949. else
  4950. begin
  4951. tmpreg:=cg.getintregister(list,OS_32);
  4952. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4953. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4954. list.concat(taicpu.op_reg_reg(A_ADD,reg.reglo,tmpreg));
  4955. end;
  4956. tmpreg:=cg.getintregister(list,OS_32);
  4957. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  4958. list.concat(taicpu.op_reg_reg(A_ADC,reg.reghi,tmpreg));
  4959. end;
  4960. OP_SUB:
  4961. begin
  4962. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4963. begin
  4964. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4965. list.concat(taicpu.op_reg_const(A_SUB,reg.reglo,aint(lo(value))))
  4966. end
  4967. else
  4968. begin
  4969. tmpreg:=cg.getintregister(list,OS_32);
  4970. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4971. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4972. list.concat(taicpu.op_reg_reg(A_SUB,reg.reglo,tmpreg));
  4973. end;
  4974. tmpreg:=cg.getintregister(list,OS_32);
  4975. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  4976. list.concat(taicpu.op_reg_reg(A_SBC,reg.reghi,tmpreg));
  4977. end;
  4978. else
  4979. internalerror(2003083101);
  4980. end;
  4981. end;
  4982. procedure create_codegen;
  4983. begin
  4984. if GenerateThumb2Code then
  4985. begin
  4986. cg:=tthumb2cgarm.create;
  4987. cg64:=tthumb2cg64farm.create;
  4988. casmoptimizer:=TCpuThumb2AsmOptimizer;
  4989. end
  4990. else if GenerateThumbCode then
  4991. begin
  4992. cg:=tthumbcgarm.create;
  4993. cg64:=tthumbcg64farm.create;
  4994. // casmoptimizer:=TCpuThumbAsmOptimizer;
  4995. end
  4996. else
  4997. begin
  4998. cg:=tarmcgarm.create;
  4999. cg64:=tarmcg64farm.create;
  5000. casmoptimizer:=TCpuAsmOptimizer;
  5001. end;
  5002. end;
  5003. end.