cgcpu.pas 213 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152215321542155215621572158215921602161216221632164216521662167216821692170217121722173217421752176217721782179218021812182218321842185218621872188218921902191219221932194219521962197219821992200220122022203220422052206220722082209221022112212221322142215221622172218221922202221222222232224222522262227222822292230223122322233223422352236223722382239224022412242224322442245224622472248224922502251225222532254225522562257225822592260226122622263226422652266226722682269227022712272227322742275227622772278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277727782779278027812782278327842785278627872788278927902791279227932794279527962797279827992800280128022803280428052806280728082809281028112812281328142815281628172818281928202821282228232824282528262827282828292830283128322833283428352836283728382839284028412842284328442845284628472848284928502851285228532854285528562857285828592860286128622863286428652866286728682869287028712872287328742875287628772878287928802881288228832884288528862887288828892890289128922893289428952896289728982899290029012902290329042905290629072908290929102911291229132914291529162917291829192920292129222923292429252926292729282929293029312932293329342935293629372938293929402941294229432944294529462947294829492950295129522953295429552956295729582959296029612962296329642965296629672968296929702971297229732974297529762977297829792980298129822983298429852986298729882989299029912992299329942995299629972998299930003001300230033004300530063007300830093010301130123013301430153016301730183019302030213022302330243025302630273028302930303031303230333034303530363037303830393040304130423043304430453046304730483049305030513052305330543055305630573058305930603061306230633064306530663067306830693070307130723073307430753076307730783079308030813082308330843085308630873088308930903091309230933094309530963097309830993100310131023103310431053106310731083109311031113112311331143115311631173118311931203121312231233124312531263127312831293130313131323133313431353136313731383139314031413142314331443145314631473148314931503151315231533154315531563157315831593160316131623163316431653166316731683169317031713172317331743175317631773178317931803181318231833184318531863187318831893190319131923193319431953196319731983199320032013202320332043205320632073208320932103211321232133214321532163217321832193220322132223223322432253226322732283229323032313232323332343235323632373238323932403241324232433244324532463247324832493250325132523253325432553256325732583259326032613262326332643265326632673268326932703271327232733274327532763277327832793280328132823283328432853286328732883289329032913292329332943295329632973298329933003301330233033304330533063307330833093310331133123313331433153316331733183319332033213322332333243325332633273328332933303331333233333334333533363337333833393340334133423343334433453346334733483349335033513352335333543355335633573358335933603361336233633364336533663367336833693370337133723373337433753376337733783379338033813382338333843385338633873388338933903391339233933394339533963397339833993400340134023403340434053406340734083409341034113412341334143415341634173418341934203421342234233424342534263427342834293430343134323433343434353436343734383439344034413442344334443445344634473448344934503451345234533454345534563457345834593460346134623463346434653466346734683469347034713472347334743475347634773478347934803481348234833484348534863487348834893490349134923493349434953496349734983499350035013502350335043505350635073508350935103511351235133514351535163517351835193520352135223523352435253526352735283529353035313532353335343535353635373538353935403541354235433544354535463547354835493550355135523553355435553556355735583559356035613562356335643565356635673568356935703571357235733574357535763577357835793580358135823583358435853586358735883589359035913592359335943595359635973598359936003601360236033604360536063607360836093610361136123613361436153616361736183619362036213622362336243625362636273628362936303631363236333634363536363637363836393640364136423643364436453646364736483649365036513652365336543655365636573658365936603661366236633664366536663667366836693670367136723673367436753676367736783679368036813682368336843685368636873688368936903691369236933694369536963697369836993700370137023703370437053706370737083709371037113712371337143715371637173718371937203721372237233724372537263727372837293730373137323733373437353736373737383739374037413742374337443745374637473748374937503751375237533754375537563757375837593760376137623763376437653766376737683769377037713772377337743775377637773778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427742784279428042814282428342844285428642874288428942904291429242934294429542964297429842994300430143024303430443054306430743084309431043114312431343144315431643174318431943204321432243234324432543264327432843294330433143324333433443354336433743384339434043414342434343444345434643474348434943504351435243534354435543564357435843594360436143624363436443654366436743684369437043714372437343744375437643774378437943804381438243834384438543864387438843894390439143924393439443954396439743984399440044014402440344044405440644074408440944104411441244134414441544164417441844194420442144224423442444254426442744284429443044314432443344344435443644374438443944404441444244434444444544464447444844494450445144524453445444554456445744584459446044614462446344644465446644674468446944704471447244734474447544764477447844794480448144824483448444854486448744884489449044914492449344944495449644974498449945004501450245034504450545064507450845094510451145124513451445154516451745184519452045214522452345244525452645274528452945304531453245334534453545364537453845394540454145424543454445454546454745484549455045514552455345544555455645574558455945604561456245634564456545664567456845694570457145724573457445754576457745784579458045814582458345844585458645874588458945904591459245934594459545964597459845994600460146024603460446054606460746084609461046114612461346144615461646174618461946204621462246234624462546264627462846294630463146324633463446354636463746384639464046414642464346444645464646474648464946504651465246534654465546564657465846594660466146624663466446654666466746684669467046714672467346744675467646774678467946804681468246834684468546864687468846894690469146924693469446954696469746984699470047014702470347044705470647074708470947104711471247134714471547164717471847194720472147224723472447254726472747284729473047314732473347344735473647374738473947404741474247434744474547464747474847494750475147524753475447554756475747584759476047614762476347644765476647674768476947704771477247734774477547764777477847794780478147824783478447854786478747884789479047914792479347944795479647974798479948004801480248034804480548064807480848094810481148124813481448154816481748184819482048214822482348244825482648274828482948304831483248334834483548364837483848394840484148424843484448454846484748484849485048514852485348544855485648574858485948604861486248634864486548664867486848694870487148724873487448754876487748784879488048814882488348844885488648874888488948904891489248934894489548964897489848994900490149024903490449054906490749084909491049114912491349144915491649174918491949204921492249234924492549264927492849294930493149324933493449354936493749384939494049414942494349444945494649474948494949504951495249534954495549564957495849594960496149624963496449654966496749684969497049714972497349744975497649774978497949804981498249834984498549864987498849894990499149924993499449954996499749984999500050015002500350045005500650075008500950105011501250135014501550165017501850195020502150225023502450255026502750285029503050315032503350345035503650375038503950405041504250435044504550465047504850495050505150525053505450555056505750585059506050615062506350645065506650675068506950705071507250735074507550765077507850795080508150825083508450855086508750885089509050915092509350945095509650975098509951005101510251035104510551065107510851095110511151125113511451155116511751185119512051215122512351245125512651275128512951305131513251335134513551365137513851395140514151425143514451455146514751485149515051515152515351545155515651575158515951605161516251635164516551665167516851695170517151725173517451755176517751785179518051815182518351845185518651875188518951905191519251935194519551965197519851995200520152025203520452055206520752085209521052115212521352145215521652175218521952205221522252235224522552265227522852295230523152325233523452355236523752385239524052415242524352445245524652475248524952505251525252535254525552565257525852595260526152625263526452655266526752685269527052715272527352745275527652775278527952805281528252835284528552865287528852895290529152925293529452955296529752985299530053015302530353045305530653075308530953105311531253135314
  1. {
  2. Copyright (c) 2003 by Florian Klaempfl
  3. Member of the Free Pascal development team
  4. This unit implements the code generator for the ARM
  5. This program is free software; you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation; either version 2 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program; if not, write to the Free Software
  15. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  16. ****************************************************************************
  17. }
  18. unit cgcpu;
  19. {$i fpcdefs.inc}
  20. interface
  21. uses
  22. globtype,symtype,symdef,
  23. cgbase,cgutils,cgobj,
  24. aasmbase,aasmcpu,aasmtai,aasmdata,
  25. parabase,
  26. cpubase,cpuinfo,cg64f32,rgcpu;
  27. type
  28. { tbasecgarm is shared between all arm architectures }
  29. tbasecgarm = class(tcg)
  30. { true, if the next arithmetic operation should modify the flags }
  31. cgsetflags : boolean;
  32. procedure a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);override;
  33. procedure a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);override;
  34. procedure a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);override;
  35. procedure a_call_name(list : TAsmList;const s : string; weak: boolean);override;
  36. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  37. { move instructions }
  38. procedure a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);override;
  39. procedure a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);override;
  40. function a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  41. function a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  42. { fpu move instructions }
  43. procedure a_loadfpu_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister); override;
  44. procedure a_loadfpu_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister); override;
  45. procedure a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference); override;
  46. procedure a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);override;
  47. { comparison operations }
  48. procedure a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  49. l : tasmlabel);override;
  50. procedure a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel); override;
  51. procedure a_jmp_name(list : TAsmList;const s : string); override;
  52. procedure a_jmp_always(list : TAsmList;l: tasmlabel); override;
  53. procedure a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel); override;
  54. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  55. procedure g_profilecode(list : TAsmList); override;
  56. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  57. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  58. procedure g_maybe_got_init(list : TAsmList); override;
  59. procedure a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);override;
  60. procedure g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);override;
  61. procedure g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);override;
  62. procedure g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  63. procedure g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  64. procedure g_overflowcheck(list: TAsmList; const l: tlocation; def: tdef); override;
  65. procedure g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);override;
  66. procedure g_save_registers(list : TAsmList);override;
  67. procedure g_restore_registers(list : TAsmList);override;
  68. procedure a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  69. procedure fixref(list : TAsmList;var ref : treference);
  70. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; virtual;
  71. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  72. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  73. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  74. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  75. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  76. procedure a_opmm_reg_reg(list: TAsmList; Op: TOpCG; size : tcgsize;src,dst: tregister;shuffle : pmmshuffle); override;
  77. { Transform unsupported methods into Internal errors }
  78. procedure a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister); override;
  79. { try to generate optimized 32 Bit multiplication, returns true if successful generated }
  80. function try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  81. { clear out potential overflow bits from 8 or 16 bit operations }
  82. { the upper 24/16 bits of a register after an operation }
  83. procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  84. { mla for thumb requires that none of the registers is equal to r13/r15, this method ensures this }
  85. procedure safe_mla(list: TAsmList;op1,op2,op3,op4 : TRegister);
  86. end;
  87. { tcgarm is shared between normal arm and thumb-2 }
  88. tcgarm = class(tbasecgarm)
  89. procedure a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister); override;
  90. procedure a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference); override;
  91. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  92. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  93. size: tcgsize; a: tcgint; src, dst: tregister); override;
  94. procedure a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  95. size: tcgsize; src1, src2, dst: tregister); override;
  96. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  97. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  98. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  99. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  100. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  101. {Multiply two 32-bit registers into lo and hi 32-bit registers}
  102. procedure a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister); override;
  103. end;
  104. { normal arm cg }
  105. tarmcgarm = class(tcgarm)
  106. procedure init_register_allocators;override;
  107. procedure done_register_allocators;override;
  108. end;
  109. { 64 bit cg for all arm flavours }
  110. tbasecg64farm = class(tcg64f32)
  111. end;
  112. { tcg64farm is shared between normal arm and thumb-2 }
  113. tcg64farm = class(tbasecg64farm)
  114. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  115. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  116. procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;
  117. procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
  118. procedure a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  119. procedure a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  120. procedure a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);override;
  121. procedure a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);override;
  122. end;
  123. tarmcg64farm = class(tcg64farm)
  124. end;
  125. tthumbcgarm = class(tbasecgarm)
  126. procedure init_register_allocators;override;
  127. procedure done_register_allocators;override;
  128. procedure g_proc_entry(list: TAsmList; localsize: longint; nostackframe: boolean);override;
  129. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  130. procedure a_op_reg_reg(list: TAsmList; Op: TOpCG; size: TCGSize; src,dst: TRegister);override;
  131. procedure a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);override;
  132. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister); override;
  133. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  134. procedure a_load_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const Ref: treference; reg: tregister);override;
  135. procedure a_load_const_reg(list: TAsmList; size: tcgsize; a: tcgint; reg: tregister);override;
  136. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  137. function handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference; override;
  138. end;
  139. tthumbcg64farm = class(tbasecg64farm)
  140. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  141. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  142. end;
  143. tthumb2cgarm = class(tcgarm)
  144. procedure init_register_allocators;override;
  145. procedure done_register_allocators;override;
  146. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  147. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  148. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  149. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  150. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  151. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  152. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  153. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  154. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  155. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; override;
  156. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  157. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  158. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  159. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  160. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  161. end;
  162. tthumb2cg64farm = class(tcg64farm)
  163. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  164. end;
  165. const
  166. OpCmp2AsmCond : Array[topcmp] of TAsmCond = (C_NONE,C_EQ,C_GT,
  167. C_LT,C_GE,C_LE,C_NE,C_LS,C_CC,C_CS,C_HI);
  168. winstackpagesize = 4096;
  169. function get_fpu_postfix(def : tdef) : toppostfix;
  170. procedure create_codegen;
  171. implementation
  172. uses
  173. globals,verbose,systems,cutils,
  174. aopt,aoptcpu,
  175. fmodule,
  176. symconst,symsym,symtable,
  177. tgobj,
  178. procinfo,cpupi,
  179. paramgr;
  180. function get_fpu_postfix(def : tdef) : toppostfix;
  181. begin
  182. if def.typ=floatdef then
  183. begin
  184. case tfloatdef(def).floattype of
  185. s32real:
  186. result:=PF_S;
  187. s64real:
  188. result:=PF_D;
  189. s80real:
  190. result:=PF_E;
  191. else
  192. internalerror(200401272);
  193. end;
  194. end
  195. else
  196. internalerror(200401271);
  197. end;
  198. procedure tarmcgarm.init_register_allocators;
  199. begin
  200. inherited init_register_allocators;
  201. { currently, we always save R14, so we can use it }
  202. if (target_info.system<>system_arm_darwin) then
  203. begin
  204. if assigned(current_procinfo) and (current_procinfo.framepointer<>NR_R11) then
  205. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  206. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  207. RS_R9,RS_R10,RS_R11,RS_R14],first_int_imreg,[])
  208. else
  209. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  210. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  211. RS_R9,RS_R10,RS_R14],first_int_imreg,[])
  212. end
  213. else
  214. { r7 is not available on Darwin, it's used as frame pointer (always,
  215. for backtrace support -- also in gcc/clang -> R11 can be used).
  216. r9 is volatile }
  217. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  218. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R9,RS_R12,RS_R4,RS_R5,RS_R6,RS_R8,
  219. RS_R10,RS_R11,RS_R14],first_int_imreg,[]);
  220. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  221. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  222. { The register allocator currently cannot deal with multiple
  223. non-overlapping subregs per register, so we can only use
  224. half the single precision registers for now (as sub registers of the
  225. double precision ones). }
  226. if current_settings.fputype=fpu_vfpv3 then
  227. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  228. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  229. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  230. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  231. ],first_mm_imreg,[])
  232. else
  233. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  234. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15],first_mm_imreg,[]);
  235. end;
  236. procedure tarmcgarm.done_register_allocators;
  237. begin
  238. rg[R_INTREGISTER].free;
  239. rg[R_FPUREGISTER].free;
  240. rg[R_MMREGISTER].free;
  241. inherited done_register_allocators;
  242. end;
  243. procedure tcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  244. var
  245. imm_shift : byte;
  246. l : tasmlabel;
  247. hr : treference;
  248. imm1, imm2: DWord;
  249. begin
  250. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  251. internalerror(2002090902);
  252. if is_shifter_const(a,imm_shift) then
  253. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  254. else if is_shifter_const(not(a),imm_shift) then
  255. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  256. { loading of constants with mov and orr }
  257. else if (split_into_shifter_const(a,imm1, imm2)) then
  258. begin
  259. list.concat(taicpu.op_reg_const(A_MOV,reg, imm1));
  260. list.concat(taicpu.op_reg_reg_const(A_ORR,reg,reg, imm2));
  261. end
  262. { loading of constants with mvn and bic }
  263. else if (split_into_shifter_const(not(a), imm1, imm2)) then
  264. begin
  265. list.concat(taicpu.op_reg_const(A_MVN,reg, imm1));
  266. list.concat(taicpu.op_reg_reg_const(A_BIC,reg,reg, imm2));
  267. end
  268. else
  269. begin
  270. reference_reset(hr,4);
  271. current_asmdata.getjumplabel(l);
  272. cg.a_label(current_procinfo.aktlocaldata,l);
  273. hr.symboldata:=current_procinfo.aktlocaldata.last;
  274. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  275. hr.symbol:=l;
  276. hr.base:=NR_PC;
  277. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  278. end;
  279. end;
  280. procedure tcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  281. var
  282. oppostfix:toppostfix;
  283. usedtmpref: treference;
  284. tmpreg,tmpreg2 : tregister;
  285. so : tshifterop;
  286. dir : integer;
  287. begin
  288. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  289. FromSize := ToSize;
  290. case FromSize of
  291. { signed integer registers }
  292. OS_8:
  293. oppostfix:=PF_B;
  294. OS_S8:
  295. oppostfix:=PF_SB;
  296. OS_16:
  297. oppostfix:=PF_H;
  298. OS_S16:
  299. oppostfix:=PF_SH;
  300. OS_32,
  301. OS_S32:
  302. oppostfix:=PF_None;
  303. else
  304. InternalError(200308297);
  305. end;
  306. if (fromsize=OS_S8) and
  307. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  308. oppostfix:=PF_B;
  309. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize])) or
  310. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  311. (oppostfix in [PF_SH,PF_H])) then
  312. begin
  313. if target_info.endian=endian_big then
  314. dir:=-1
  315. else
  316. dir:=1;
  317. case FromSize of
  318. OS_16,OS_S16:
  319. begin
  320. { only complicated references need an extra loadaddr }
  321. if assigned(ref.symbol) or
  322. (ref.index<>NR_NO) or
  323. (ref.offset<-4095) or
  324. (ref.offset>4094) or
  325. { sometimes the compiler reused registers }
  326. (reg=ref.index) or
  327. (reg=ref.base) then
  328. begin
  329. tmpreg2:=getintregister(list,OS_INT);
  330. a_loadaddr_ref_reg(list,ref,tmpreg2);
  331. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  332. end
  333. else
  334. usedtmpref:=ref;
  335. if target_info.endian=endian_big then
  336. inc(usedtmpref.offset,1);
  337. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  338. tmpreg:=getintregister(list,OS_INT);
  339. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  340. inc(usedtmpref.offset,dir);
  341. if FromSize=OS_16 then
  342. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  343. else
  344. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  345. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  346. end;
  347. OS_32,OS_S32:
  348. begin
  349. tmpreg:=getintregister(list,OS_INT);
  350. { only complicated references need an extra loadaddr }
  351. if assigned(ref.symbol) or
  352. (ref.index<>NR_NO) or
  353. (ref.offset<-4095) or
  354. (ref.offset>4092) or
  355. { sometimes the compiler reused registers }
  356. (reg=ref.index) or
  357. (reg=ref.base) then
  358. begin
  359. tmpreg2:=getintregister(list,OS_INT);
  360. a_loadaddr_ref_reg(list,ref,tmpreg2);
  361. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  362. end
  363. else
  364. usedtmpref:=ref;
  365. shifterop_reset(so);so.shiftmode:=SM_LSL;
  366. if ref.alignment=2 then
  367. begin
  368. if target_info.endian=endian_big then
  369. inc(usedtmpref.offset,2);
  370. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  371. inc(usedtmpref.offset,dir*2);
  372. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  373. so.shiftimm:=16;
  374. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  375. end
  376. else
  377. begin
  378. tmpreg2:=getintregister(list,OS_INT);
  379. if target_info.endian=endian_big then
  380. inc(usedtmpref.offset,3);
  381. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  382. inc(usedtmpref.offset,dir);
  383. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  384. inc(usedtmpref.offset,dir);
  385. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg2);
  386. so.shiftimm:=8;
  387. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  388. inc(usedtmpref.offset,dir);
  389. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  390. so.shiftimm:=16;
  391. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg2,so));
  392. so.shiftimm:=24;
  393. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  394. end;
  395. end
  396. else
  397. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  398. end;
  399. end
  400. else
  401. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  402. if (fromsize=OS_S8) and
  403. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  404. a_load_reg_reg(list,OS_S8,OS_32,reg,reg)
  405. else if (fromsize=OS_S8) and (tosize = OS_16) then
  406. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  407. end;
  408. procedure tcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  409. var
  410. hsym : tsym;
  411. href : treference;
  412. paraloc : Pcgparalocation;
  413. shift : byte;
  414. begin
  415. { calculate the parameter info for the procdef }
  416. procdef.init_paraloc_info(callerside);
  417. hsym:=tsym(procdef.parast.Find('self'));
  418. if not(assigned(hsym) and
  419. (hsym.typ=paravarsym)) then
  420. internalerror(200305251);
  421. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  422. while paraloc<>nil do
  423. with paraloc^ do
  424. begin
  425. case loc of
  426. LOC_REGISTER:
  427. begin
  428. if is_shifter_const(ioffset,shift) then
  429. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  430. else
  431. begin
  432. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  433. a_op_reg_reg(list,OP_SUB,size,NR_R12,register);
  434. end;
  435. end;
  436. LOC_REFERENCE:
  437. begin
  438. { offset in the wrapper needs to be adjusted for the stored
  439. return address }
  440. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),sizeof(pint));
  441. if is_shifter_const(ioffset,shift) then
  442. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  443. else
  444. begin
  445. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  446. a_op_reg_ref(list,OP_SUB,size,NR_R12,href);
  447. end;
  448. end
  449. else
  450. internalerror(200309189);
  451. end;
  452. paraloc:=next;
  453. end;
  454. end;
  455. procedure tbasecgarm.a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);
  456. var
  457. ref: treference;
  458. begin
  459. paraloc.check_simple_location;
  460. paramanager.allocparaloc(list,paraloc.location);
  461. case paraloc.location^.loc of
  462. LOC_REGISTER,LOC_CREGISTER:
  463. a_load_const_reg(list,size,a,paraloc.location^.register);
  464. LOC_REFERENCE:
  465. begin
  466. reference_reset(ref,paraloc.alignment);
  467. ref.base:=paraloc.location^.reference.index;
  468. ref.offset:=paraloc.location^.reference.offset;
  469. a_load_const_ref(list,size,a,ref);
  470. end;
  471. else
  472. internalerror(2002081101);
  473. end;
  474. end;
  475. procedure tbasecgarm.a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);
  476. var
  477. tmpref, ref: treference;
  478. location: pcgparalocation;
  479. sizeleft: aint;
  480. begin
  481. location := paraloc.location;
  482. tmpref := r;
  483. sizeleft := paraloc.intsize;
  484. while assigned(location) do
  485. begin
  486. paramanager.allocparaloc(list,location);
  487. case location^.loc of
  488. LOC_REGISTER,LOC_CREGISTER:
  489. a_load_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  490. LOC_REFERENCE:
  491. begin
  492. reference_reset_base(ref,location^.reference.index,location^.reference.offset,paraloc.alignment);
  493. { doubles in softemu mode have a strange order of registers and references }
  494. if location^.size=OS_32 then
  495. g_concatcopy(list,tmpref,ref,4)
  496. else
  497. begin
  498. g_concatcopy(list,tmpref,ref,sizeleft);
  499. if assigned(location^.next) then
  500. internalerror(2005010710);
  501. end;
  502. end;
  503. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  504. case location^.size of
  505. OS_F32, OS_F64:
  506. a_loadfpu_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  507. else
  508. internalerror(2002072801);
  509. end;
  510. LOC_VOID:
  511. begin
  512. // nothing to do
  513. end;
  514. else
  515. internalerror(2002081103);
  516. end;
  517. inc(tmpref.offset,tcgsize2size[location^.size]);
  518. dec(sizeleft,tcgsize2size[location^.size]);
  519. location := location^.next;
  520. end;
  521. end;
  522. procedure tbasecgarm.a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);
  523. var
  524. ref: treference;
  525. tmpreg: tregister;
  526. begin
  527. paraloc.check_simple_location;
  528. paramanager.allocparaloc(list,paraloc.location);
  529. case paraloc.location^.loc of
  530. LOC_REGISTER,LOC_CREGISTER:
  531. a_loadaddr_ref_reg(list,r,paraloc.location^.register);
  532. LOC_REFERENCE:
  533. begin
  534. reference_reset(ref,paraloc.alignment);
  535. ref.base := paraloc.location^.reference.index;
  536. ref.offset := paraloc.location^.reference.offset;
  537. tmpreg := getintregister(list,OS_ADDR);
  538. a_loadaddr_ref_reg(list,r,tmpreg);
  539. a_load_reg_ref(list,OS_ADDR,OS_ADDR,tmpreg,ref);
  540. end;
  541. else
  542. internalerror(2002080701);
  543. end;
  544. end;
  545. procedure tbasecgarm.a_call_name(list : TAsmList;const s : string; weak: boolean);
  546. var
  547. branchopcode: tasmop;
  548. r : treference;
  549. sym : TAsmSymbol;
  550. begin
  551. { check not really correct: should only be used for non-Thumb cpus }
  552. if (CPUARM_HAS_BLX_LABEL in cpu_capabilities[current_settings.cputype]) and
  553. { WinCE GNU AS (not sure if this applies in general) does not support BLX imm }
  554. (target_info.system<>system_arm_wince) then
  555. branchopcode:=A_BLX
  556. else
  557. branchopcode:=A_BL;
  558. if not(weak) then
  559. sym:=current_asmdata.RefAsmSymbol(s)
  560. else
  561. sym:=current_asmdata.WeakRefAsmSymbol(s);
  562. reference_reset_symbol(r,sym,0,sizeof(pint));
  563. if (tf_pic_uses_got in target_info.flags) and
  564. (cs_create_pic in current_settings.moduleswitches) then
  565. begin
  566. r.refaddr:=addr_pic
  567. end
  568. else
  569. r.refaddr:=addr_full;
  570. list.concat(taicpu.op_ref(branchopcode,r));
  571. {
  572. the compiler does not properly set this flag anymore in pass 1, and
  573. for now we only need it after pass 2 (I hope) (JM)
  574. if not(pi_do_call in current_procinfo.flags) then
  575. internalerror(2003060703);
  576. }
  577. include(current_procinfo.flags,pi_do_call);
  578. end;
  579. procedure tbasecgarm.a_call_reg(list : TAsmList;reg: tregister);
  580. begin
  581. { check not really correct: should only be used for non-Thumb cpus }
  582. if not(CPUARM_HAS_BLX in cpu_capabilities[current_settings.cputype]) then
  583. begin
  584. list.concat(taicpu.op_reg_reg(A_MOV,NR_R14,NR_PC));
  585. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,reg));
  586. end
  587. else
  588. list.concat(taicpu.op_reg(A_BLX, reg));
  589. {
  590. the compiler does not properly set this flag anymore in pass 1, and
  591. for now we only need it after pass 2 (I hope) (JM)
  592. if not(pi_do_call in current_procinfo.flags) then
  593. internalerror(2003060703);
  594. }
  595. include(current_procinfo.flags,pi_do_call);
  596. end;
  597. procedure tcgarm.a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister);
  598. begin
  599. a_op_const_reg_reg(list,op,size,a,reg,reg);
  600. end;
  601. procedure tcgarm.a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference);
  602. var
  603. tmpreg,tmpresreg : tregister;
  604. tmpref : treference;
  605. begin
  606. tmpreg:=getintregister(list,size);
  607. tmpresreg:=getintregister(list,size);
  608. tmpref:=a_internal_load_ref_reg(list,size,size,ref,tmpreg);
  609. a_op_const_reg_reg(list,op,size,a,tmpreg,tmpresreg);
  610. a_load_reg_ref(list,size,size,tmpresreg,tmpref);
  611. end;
  612. procedure tcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  613. var
  614. so : tshifterop;
  615. begin
  616. if op = OP_NEG then
  617. begin
  618. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,src,0));
  619. maybeadjustresult(list,OP_NEG,size,dst);
  620. end
  621. else if op = OP_NOT then
  622. begin
  623. if size in [OS_8, OS_16, OS_S8, OS_S16] then
  624. begin
  625. shifterop_reset(so);
  626. so.shiftmode:=SM_LSL;
  627. if size in [OS_8, OS_S8] then
  628. so.shiftimm:=24
  629. else
  630. so.shiftimm:=16;
  631. list.concat(taicpu.op_reg_reg_shifterop(A_MVN,dst,src,so));
  632. {Using a shift here allows this to be folded into another instruction}
  633. if size in [OS_S8, OS_S16] then
  634. so.shiftmode:=SM_ASR
  635. else
  636. so.shiftmode:=SM_LSR;
  637. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  638. end
  639. else
  640. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  641. end
  642. else
  643. a_op_reg_reg_reg(list,op,size,src,dst,dst);
  644. end;
  645. const
  646. op_reg_reg_opcg2asmop: array[TOpCG] of tasmop =
  647. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  648. A_NONE,A_NONE,A_NONE,A_SUB,A_EOR,A_NONE,A_NONE);
  649. op_reg_opcg2asmop: array[TOpCG] of tasmop =
  650. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  651. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  652. op_reg_postfix: array[TOpCG] of TOpPostfix =
  653. (PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,
  654. PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None);
  655. procedure tcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  656. size: tcgsize; a: tcgint; src, dst: tregister);
  657. var
  658. ovloc : tlocation;
  659. begin
  660. a_op_const_reg_reg_checkoverflow(list,op,size,a,src,dst,false,ovloc);
  661. end;
  662. procedure tcgarm.a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  663. size: tcgsize; src1, src2, dst: tregister);
  664. var
  665. ovloc : tlocation;
  666. begin
  667. a_op_reg_reg_reg_checkoverflow(list,op,size,src1,src2,dst,false,ovloc);
  668. end;
  669. function opshift2shiftmode(op: TOpCg): tshiftmode;
  670. begin
  671. case op of
  672. OP_SHL: Result:=SM_LSL;
  673. OP_SHR: Result:=SM_LSR;
  674. OP_ROR: Result:=SM_ROR;
  675. OP_ROL: Result:=SM_ROR;
  676. OP_SAR: Result:=SM_ASR;
  677. else internalerror(2012070501);
  678. end
  679. end;
  680. function tbasecgarm.try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  681. var
  682. multiplier : dword;
  683. power : longint;
  684. shifterop : tshifterop;
  685. bitsset : byte;
  686. negative : boolean;
  687. first : boolean;
  688. b,
  689. cycles : byte;
  690. maxeffort : byte;
  691. begin
  692. result:=true;
  693. cycles:=0;
  694. negative:=a<0;
  695. shifterop.rs:=NR_NO;
  696. shifterop.shiftmode:=SM_LSL;
  697. if negative then
  698. inc(cycles);
  699. multiplier:=dword(abs(a));
  700. bitsset:=popcnt(multiplier and $fffffffe);
  701. { heuristics to estimate how much instructions are reasonable to replace the mul,
  702. this is currently based on XScale timings }
  703. { in the simplest case, we need a mov to load the constant and a mul to carry out the
  704. actual multiplication, this requires min. 1+4 cycles
  705. because the first shift imm. might cause a stall and because we need more instructions
  706. when replacing the mul we generate max. 3 instructions to replace this mul }
  707. maxeffort:=3;
  708. { if the constant is not a shifter op, we need either some mov/mvn/bic/or sequence or
  709. a ldr, so generating one more operation to replace this is beneficial }
  710. if not(is_shifter_const(dword(a),b)) and not(is_shifter_const(not(dword(a)),b)) then
  711. inc(maxeffort);
  712. { if the upper 5 bits are all set or clear, mul is one cycle faster }
  713. if ((dword(a) and $f8000000)=0) or ((dword(a) and $f8000000)=$f8000000) then
  714. dec(maxeffort);
  715. { if the upper 17 bits are all set or clear, mul is another cycle faster }
  716. if ((dword(a) and $ffff8000)=0) or ((dword(a) and $ffff8000)=$ffff8000) then
  717. dec(maxeffort);
  718. { most simple cases }
  719. if a=1 then
  720. a_load_reg_reg(list,OS_32,OS_32,src,dst)
  721. else if a=0 then
  722. a_load_const_reg(list,OS_32,0,dst)
  723. else if a=-1 then
  724. a_op_reg_reg(list,OP_NEG,OS_32,src,dst)
  725. { add up ?
  726. basically, one add is needed for each bit being set in the constant factor
  727. however, the least significant bit is for free, it can be hidden in the initial
  728. instruction
  729. }
  730. else if (bitsset+cycles<=maxeffort) and
  731. (bitsset<=popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)) then
  732. begin
  733. first:=true;
  734. while multiplier<>0 do
  735. begin
  736. shifterop.shiftimm:=BsrDWord(multiplier);
  737. if odd(multiplier) then
  738. begin
  739. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,shifterop));
  740. dec(multiplier);
  741. end
  742. else
  743. if first then
  744. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  745. else
  746. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,src,shifterop));
  747. first:=false;
  748. dec(multiplier,1 shl shifterop.shiftimm);
  749. end;
  750. if negative then
  751. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  752. end
  753. { subtract from the next greater power of two? }
  754. else if popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)+cycles+1<=maxeffort then
  755. begin
  756. first:=true;
  757. while multiplier<>0 do
  758. begin
  759. if first then
  760. begin
  761. multiplier:=(1 shl power)-multiplier;
  762. shifterop.shiftimm:=power;
  763. end
  764. else
  765. shifterop.shiftimm:=BsrDWord(multiplier);
  766. if odd(multiplier) then
  767. begin
  768. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,shifterop));
  769. dec(multiplier);
  770. end
  771. else
  772. if first then
  773. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  774. else
  775. begin
  776. list.concat(taicpu.op_reg_reg_reg_shifterop(A_SUB,dst,dst,src,shifterop));
  777. dec(multiplier,1 shl shifterop.shiftimm);
  778. end;
  779. first:=false;
  780. end;
  781. if negative then
  782. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  783. end
  784. else
  785. result:=false;
  786. end;
  787. procedure tcgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  788. var
  789. shift, lsb, width : byte;
  790. tmpreg : tregister;
  791. so : tshifterop;
  792. l1 : longint;
  793. imm1, imm2: DWord;
  794. begin
  795. optimize_op_const(size, op, a);
  796. case op of
  797. OP_NONE:
  798. begin
  799. if src <> dst then
  800. a_load_reg_reg(list, size, size, src, dst);
  801. exit;
  802. end;
  803. OP_MOVE:
  804. begin
  805. a_load_const_reg(list, size, a, dst);
  806. exit;
  807. end;
  808. end;
  809. ovloc.loc:=LOC_VOID;
  810. if {$ifopt R+}(a<>-2147483648) and{$endif} not setflags and is_shifter_const(-a,shift) then
  811. case op of
  812. OP_ADD:
  813. begin
  814. op:=OP_SUB;
  815. a:=aint(dword(-a));
  816. end;
  817. OP_SUB:
  818. begin
  819. op:=OP_ADD;
  820. a:=aint(dword(-a));
  821. end
  822. end;
  823. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  824. case op of
  825. OP_NEG,OP_NOT:
  826. internalerror(200308281);
  827. OP_SHL,
  828. OP_SHR,
  829. OP_ROL,
  830. OP_ROR,
  831. OP_SAR:
  832. begin
  833. if a>32 then
  834. internalerror(200308294);
  835. shifterop_reset(so);
  836. so.shiftmode:=opshift2shiftmode(op);
  837. if op = OP_ROL then
  838. so.shiftimm:=32-a
  839. else
  840. so.shiftimm:=a;
  841. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  842. end;
  843. else
  844. {if (op in [OP_SUB, OP_ADD]) and
  845. ((a < 0) or
  846. (a > 4095)) then
  847. begin
  848. tmpreg:=getintregister(list,size);
  849. list.concat(taicpu.op_reg_const(A_MOVT, tmpreg, (a shr 16) and $FFFF));
  850. list.concat(taicpu.op_reg_const(A_MOV, tmpreg, a and $FFFF));
  851. list.concat(setoppostfix(taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))
  852. ));
  853. end
  854. else}
  855. begin
  856. if cgsetflags or setflags then
  857. a_reg_alloc(list,NR_DEFAULTFLAGS);
  858. list.concat(setoppostfix(
  859. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  860. end;
  861. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  862. begin
  863. ovloc.loc:=LOC_FLAGS;
  864. case op of
  865. OP_ADD:
  866. ovloc.resflags:=F_CS;
  867. OP_SUB:
  868. ovloc.resflags:=F_CC;
  869. end;
  870. end;
  871. end
  872. else
  873. begin
  874. { there could be added some more sophisticated optimizations }
  875. if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  876. a_op_reg_reg(list,OP_NEG,size,src,dst)
  877. { we do this here instead in the peephole optimizer because
  878. it saves us a register }
  879. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  880. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  881. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  882. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  883. begin
  884. if l1>32 then{roozbeh does this ever happen?}
  885. internalerror(200308296);
  886. shifterop_reset(so);
  887. so.shiftmode:=SM_LSL;
  888. so.shiftimm:=l1;
  889. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  890. end
  891. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  892. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  893. begin
  894. if l1>32 then{does this ever happen?}
  895. internalerror(201205181);
  896. shifterop_reset(so);
  897. so.shiftmode:=SM_LSL;
  898. so.shiftimm:=l1;
  899. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  900. end
  901. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  902. begin
  903. { nothing to do on success }
  904. end
  905. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  906. broader range of shifterconstants.}
  907. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  908. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  909. { Doing two shifts instead of two bics might allow the peephole optimizer to fold the second shift
  910. into the following instruction}
  911. else if (op = OP_AND) and
  912. is_continuous_mask(a, lsb, width) and
  913. ((lsb = 0) or ((lsb + width) = 32)) then
  914. begin
  915. shifterop_reset(so);
  916. if (width = 16) and
  917. (lsb = 0) and
  918. (current_settings.cputype >= cpu_armv6) then
  919. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  920. else if (width = 8) and
  921. (lsb = 0) and
  922. (current_settings.cputype >= cpu_armv6) then
  923. list.concat(taicpu.op_reg_reg(A_UXTB,dst,src))
  924. else if lsb = 0 then
  925. begin
  926. so.shiftmode:=SM_LSL;
  927. so.shiftimm:=32-width;
  928. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  929. so.shiftmode:=SM_LSR;
  930. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  931. end
  932. else
  933. begin
  934. so.shiftmode:=SM_LSR;
  935. so.shiftimm:=lsb;
  936. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  937. so.shiftmode:=SM_LSL;
  938. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  939. end;
  940. end
  941. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  942. begin
  943. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,imm1));
  944. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  945. end
  946. else if (op in [OP_ADD, OP_SUB, OP_OR, OP_XOR]) and
  947. not(cgsetflags or setflags) and
  948. split_into_shifter_const(a, imm1, imm2) then
  949. begin
  950. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,imm1));
  951. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  952. end
  953. else
  954. begin
  955. tmpreg:=getintregister(list,size);
  956. a_load_const_reg(list,size,a,tmpreg);
  957. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  958. end;
  959. end;
  960. maybeadjustresult(list,op,size,dst);
  961. end;
  962. procedure tcgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  963. var
  964. so : tshifterop;
  965. tmpreg,overflowreg : tregister;
  966. asmop : tasmop;
  967. begin
  968. ovloc.loc:=LOC_VOID;
  969. case op of
  970. OP_NEG,OP_NOT,
  971. OP_DIV,OP_IDIV:
  972. internalerror(200308283);
  973. OP_SHL,
  974. OP_SHR,
  975. OP_SAR,
  976. OP_ROR:
  977. begin
  978. if (op = OP_ROR) and not(size in [OS_32,OS_S32]) then
  979. internalerror(2008072801);
  980. shifterop_reset(so);
  981. so.rs:=src1;
  982. so.shiftmode:=opshift2shiftmode(op);
  983. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  984. end;
  985. OP_ROL:
  986. begin
  987. if not(size in [OS_32,OS_S32]) then
  988. internalerror(2008072801);
  989. { simulate ROL by ror'ing 32-value }
  990. tmpreg:=getintregister(list,OS_32);
  991. list.concat(taicpu.op_reg_reg_const(A_RSB,tmpreg,src1, 32));
  992. shifterop_reset(so);
  993. so.rs:=tmpreg;
  994. so.shiftmode:=SM_ROR;
  995. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  996. end;
  997. OP_IMUL,
  998. OP_MUL:
  999. begin
  1000. if (cgsetflags or setflags) and
  1001. (CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype]) then
  1002. begin
  1003. overflowreg:=getintregister(list,size);
  1004. if op=OP_IMUL then
  1005. asmop:=A_SMULL
  1006. else
  1007. asmop:=A_UMULL;
  1008. { the arm doesn't allow that rd and rm are the same }
  1009. if dst=src2 then
  1010. begin
  1011. if dst<>src1 then
  1012. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  1013. else
  1014. begin
  1015. tmpreg:=getintregister(list,size);
  1016. a_load_reg_reg(list,size,size,src2,dst);
  1017. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  1018. end;
  1019. end
  1020. else
  1021. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  1022. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1023. if op=OP_IMUL then
  1024. begin
  1025. shifterop_reset(so);
  1026. so.shiftmode:=SM_ASR;
  1027. so.shiftimm:=31;
  1028. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  1029. end
  1030. else
  1031. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  1032. ovloc.loc:=LOC_FLAGS;
  1033. ovloc.resflags:=F_NE;
  1034. end
  1035. else
  1036. begin
  1037. { the arm doesn't allow that rd and rm are the same }
  1038. if dst=src2 then
  1039. begin
  1040. if dst<>src1 then
  1041. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  1042. else
  1043. begin
  1044. tmpreg:=getintregister(list,size);
  1045. a_load_reg_reg(list,size,size,src2,dst);
  1046. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  1047. end;
  1048. end
  1049. else
  1050. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  1051. end;
  1052. end;
  1053. else
  1054. begin
  1055. if cgsetflags or setflags then
  1056. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1057. list.concat(setoppostfix(
  1058. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  1059. end;
  1060. end;
  1061. maybeadjustresult(list,op,size,dst);
  1062. end;
  1063. procedure tcgarm.a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister);
  1064. var
  1065. asmop: tasmop;
  1066. begin
  1067. if CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype] then
  1068. begin
  1069. list.concat(tai_comment.create(strpnew('tcgarm.a_mul_reg_reg_pair called')));
  1070. case size of
  1071. OS_32: asmop:=A_UMULL;
  1072. OS_S32: asmop:=A_SMULL;
  1073. else
  1074. InternalError(2014060802);
  1075. end;
  1076. { The caller might omit dstlo or dsthi, when he is not interested in it, we still
  1077. need valid registers everywhere. In case of dsthi = NR_NO we could fall back to
  1078. 32x32=32 bit multiplication}
  1079. if (dstlo = NR_NO) then
  1080. dstlo:=getintregister(list,size);
  1081. if (dsthi = NR_NO) then
  1082. dsthi:=getintregister(list,size);
  1083. list.concat(taicpu.op_reg_reg_reg_reg(asmop, dstlo, dsthi, src1,src2));
  1084. end
  1085. else if dsthi=NR_NO then
  1086. begin
  1087. if (dstlo = NR_NO) then
  1088. dstlo:=getintregister(list,size);
  1089. list.concat(taicpu.op_reg_reg_reg(A_MUL, dstlo, src1,src2));
  1090. end
  1091. else
  1092. begin
  1093. internalerror(2015083022);
  1094. end;
  1095. end;
  1096. function tbasecgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  1097. var
  1098. tmpreg1,tmpreg2 : tregister;
  1099. begin
  1100. tmpreg1:=NR_NO;
  1101. { Be sure to have a base register }
  1102. if (ref.base=NR_NO) then
  1103. begin
  1104. if ref.shiftmode<>SM_None then
  1105. internalerror(2014020701);
  1106. ref.base:=ref.index;
  1107. ref.index:=NR_NO;
  1108. end;
  1109. { absolute symbols can't be handled directly, we've to store the symbol reference
  1110. in the text segment and access it pc relative
  1111. For now, we assume that references where base or index equals to PC are already
  1112. relative, all other references are assumed to be absolute and thus they need
  1113. to be handled extra.
  1114. A proper solution would be to change refoptions to a set and store the information
  1115. if the symbol is absolute or relative there.
  1116. }
  1117. if (assigned(ref.symbol) and
  1118. not(is_pc(ref.base)) and
  1119. not(is_pc(ref.index))
  1120. ) or
  1121. { [#xxx] isn't a valid address operand }
  1122. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  1123. (ref.offset<-4095) or
  1124. (ref.offset>4095) or
  1125. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  1126. ((ref.offset<-255) or
  1127. (ref.offset>255)
  1128. )
  1129. ) or
  1130. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1131. ((ref.offset<-1020) or
  1132. (ref.offset>1020) or
  1133. ((abs(ref.offset) mod 4)<>0)
  1134. )
  1135. ) or
  1136. ((GenerateThumbCode) and
  1137. (((oppostfix in [PF_SB,PF_SH]) and (ref.offset<>0)) or
  1138. ((oppostfix=PF_None) and ((ref.offset<0) or ((ref.base<>NR_STACK_POINTER_REG) and (ref.offset>124)) or
  1139. ((ref.base=NR_STACK_POINTER_REG) and (ref.offset>1020)) or ((ref.offset mod 4)<>0))) or
  1140. ((oppostfix=PF_H) and ((ref.offset<0) or (ref.offset>62) or ((ref.offset mod 2)<>0) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0)))) or
  1141. ((oppostfix=PF_B) and ((ref.offset<0) or (ref.offset>31) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0))))
  1142. )
  1143. ) then
  1144. begin
  1145. fixref(list,ref);
  1146. end;
  1147. if GenerateThumbCode then
  1148. begin
  1149. { certain thumb load require base and index }
  1150. if (oppostfix in [PF_SB,PF_SH]) and
  1151. (ref.base<>NR_NO) and (ref.index=NR_NO) then
  1152. begin
  1153. tmpreg1:=getintregister(list,OS_ADDR);
  1154. a_load_const_reg(list,OS_ADDR,0,tmpreg1);
  1155. ref.index:=tmpreg1;
  1156. end;
  1157. { "hi" registers cannot be used as base or index }
  1158. if (getsupreg(ref.base) in [RS_R8..RS_R12,RS_R14]) or
  1159. ((ref.base=NR_R13) and (ref.index<>NR_NO)) then
  1160. begin
  1161. tmpreg1:=getintregister(list,OS_ADDR);
  1162. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.base,tmpreg1);
  1163. ref.base:=tmpreg1;
  1164. end;
  1165. if getsupreg(ref.index) in [RS_R8..RS_R14] then
  1166. begin
  1167. tmpreg1:=getintregister(list,OS_ADDR);
  1168. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.index,tmpreg1);
  1169. ref.index:=tmpreg1;
  1170. end;
  1171. end;
  1172. { fold if there is base, index and offset, however, don't fold
  1173. for vfp memory instructions because we later fold the index }
  1174. if not((op in [A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1175. (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  1176. begin
  1177. if tmpreg1<>NR_NO then
  1178. begin
  1179. tmpreg2:=getintregister(list,OS_ADDR);
  1180. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg1,tmpreg2);
  1181. tmpreg1:=tmpreg2;
  1182. end
  1183. else
  1184. begin
  1185. tmpreg1:=getintregister(list,OS_ADDR);
  1186. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg1);
  1187. ref.base:=tmpreg1;
  1188. end;
  1189. ref.offset:=0;
  1190. end;
  1191. { floating point operations have only limited references
  1192. we expect here, that a base is already set }
  1193. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  1194. begin
  1195. if ref.shiftmode<>SM_none then
  1196. internalerror(200309121);
  1197. if tmpreg1<>NR_NO then
  1198. begin
  1199. if ref.base=tmpreg1 then
  1200. begin
  1201. if ref.signindex<0 then
  1202. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,tmpreg1,ref.index))
  1203. else
  1204. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,tmpreg1,ref.index));
  1205. ref.index:=NR_NO;
  1206. end
  1207. else
  1208. begin
  1209. if ref.index<>tmpreg1 then
  1210. internalerror(200403161);
  1211. if ref.signindex<0 then
  1212. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,ref.base,tmpreg1))
  1213. else
  1214. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,tmpreg1));
  1215. ref.base:=tmpreg1;
  1216. ref.index:=NR_NO;
  1217. end;
  1218. end
  1219. else
  1220. begin
  1221. tmpreg1:=getintregister(list,OS_ADDR);
  1222. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,ref.index));
  1223. ref.base:=tmpreg1;
  1224. ref.index:=NR_NO;
  1225. end;
  1226. end;
  1227. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  1228. Result := ref;
  1229. end;
  1230. procedure tbasecgarm.a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);
  1231. var
  1232. oppostfix:toppostfix;
  1233. usedtmpref: treference;
  1234. tmpreg : tregister;
  1235. dir : integer;
  1236. begin
  1237. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  1238. FromSize := ToSize;
  1239. case ToSize of
  1240. { signed integer registers }
  1241. OS_8,
  1242. OS_S8:
  1243. oppostfix:=PF_B;
  1244. OS_16,
  1245. OS_S16:
  1246. oppostfix:=PF_H;
  1247. OS_32,
  1248. OS_S32,
  1249. { for vfp value stored in integer register }
  1250. OS_F32:
  1251. oppostfix:=PF_None;
  1252. else
  1253. InternalError(200308299);
  1254. end;
  1255. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[tosize])) or
  1256. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  1257. (oppostfix =PF_H)) then
  1258. begin
  1259. if target_info.endian=endian_big then
  1260. dir:=-1
  1261. else
  1262. dir:=1;
  1263. case FromSize of
  1264. OS_16,OS_S16:
  1265. begin
  1266. tmpreg:=getintregister(list,OS_INT);
  1267. usedtmpref:=ref;
  1268. if target_info.endian=endian_big then
  1269. inc(usedtmpref.offset,1);
  1270. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1271. inc(usedtmpref.offset,dir);
  1272. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1273. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1274. end;
  1275. OS_32,OS_S32:
  1276. begin
  1277. tmpreg:=getintregister(list,OS_INT);
  1278. usedtmpref:=ref;
  1279. if ref.alignment=2 then
  1280. begin
  1281. if target_info.endian=endian_big then
  1282. inc(usedtmpref.offset,2);
  1283. usedtmpref:=a_internal_load_reg_ref(list,OS_16,OS_16,reg,usedtmpref);
  1284. a_op_const_reg_reg(list,OP_SHR,OS_INT,16,reg,tmpreg);
  1285. inc(usedtmpref.offset,dir*2);
  1286. a_internal_load_reg_ref(list,OS_16,OS_16,tmpreg,usedtmpref);
  1287. end
  1288. else
  1289. begin
  1290. if target_info.endian=endian_big then
  1291. inc(usedtmpref.offset,3);
  1292. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1293. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1294. inc(usedtmpref.offset,dir);
  1295. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1296. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1297. inc(usedtmpref.offset,dir);
  1298. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1299. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1300. inc(usedtmpref.offset,dir);
  1301. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1302. end;
  1303. end
  1304. else
  1305. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1306. end;
  1307. end
  1308. else
  1309. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1310. end;
  1311. function tbasecgarm.a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  1312. var
  1313. oppostfix:toppostfix;
  1314. href: treference;
  1315. tmpreg: TRegister;
  1316. begin
  1317. case ToSize of
  1318. { signed integer registers }
  1319. OS_8,
  1320. OS_S8:
  1321. oppostfix:=PF_B;
  1322. OS_16,
  1323. OS_S16:
  1324. oppostfix:=PF_H;
  1325. OS_32,
  1326. OS_S32:
  1327. oppostfix:=PF_None;
  1328. else
  1329. InternalError(2003082910);
  1330. end;
  1331. if (tosize in [OS_S16,OS_16]) and
  1332. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1333. begin
  1334. result:=handle_load_store(list,A_STR,PF_B,reg,ref);
  1335. tmpreg:=getintregister(list,OS_INT);
  1336. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1337. href:=result;
  1338. inc(href.offset);
  1339. handle_load_store(list,A_STR,PF_B,tmpreg,href);
  1340. end
  1341. else
  1342. result:=handle_load_store(list,A_STR,oppostfix,reg,ref);
  1343. end;
  1344. function tbasecgarm.a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  1345. var
  1346. oppostfix:toppostfix;
  1347. so: tshifterop;
  1348. tmpreg: TRegister;
  1349. href: treference;
  1350. begin
  1351. case FromSize of
  1352. { signed integer registers }
  1353. OS_8:
  1354. oppostfix:=PF_B;
  1355. OS_S8:
  1356. oppostfix:=PF_SB;
  1357. OS_16:
  1358. oppostfix:=PF_H;
  1359. OS_S16:
  1360. oppostfix:=PF_SH;
  1361. OS_32,
  1362. OS_S32:
  1363. oppostfix:=PF_None;
  1364. else
  1365. InternalError(200308291);
  1366. end;
  1367. if (tosize=OS_S8) and
  1368. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1369. begin
  1370. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1371. a_load_reg_reg(list,OS_S8,OS_32,reg,reg);
  1372. end
  1373. else if (tosize in [OS_S16,OS_16]) and
  1374. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1375. begin
  1376. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1377. tmpreg:=getintregister(list,OS_INT);
  1378. href:=result;
  1379. inc(href.offset);
  1380. handle_load_store(list,A_LDR,PF_B,tmpreg,href);
  1381. shifterop_reset(so);
  1382. so.shiftmode:=SM_LSL;
  1383. so.shiftimm:=8;
  1384. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  1385. end
  1386. else
  1387. result:=handle_load_store(list,A_LDR,oppostfix,reg,ref);
  1388. end;
  1389. procedure tbasecgarm.a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);
  1390. var
  1391. so : tshifterop;
  1392. procedure do_shift(shiftmode : tshiftmode; shiftimm : byte; reg : tregister);
  1393. begin
  1394. if GenerateThumbCode then
  1395. begin
  1396. case shiftmode of
  1397. SM_ASR:
  1398. a_op_const_reg_reg(list,OP_SAR,OS_32,shiftimm,reg,reg2);
  1399. SM_LSR:
  1400. a_op_const_reg_reg(list,OP_SHR,OS_32,shiftimm,reg,reg2);
  1401. SM_LSL:
  1402. a_op_const_reg_reg(list,OP_SHL,OS_32,shiftimm,reg,reg2);
  1403. else
  1404. internalerror(2013090301);
  1405. end;
  1406. end
  1407. else
  1408. begin
  1409. so.shiftmode:=shiftmode;
  1410. so.shiftimm:=shiftimm;
  1411. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,reg2,reg,so));
  1412. end;
  1413. end;
  1414. var
  1415. instr: taicpu;
  1416. conv_done: boolean;
  1417. begin
  1418. if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then
  1419. internalerror(2002090901);
  1420. conv_done:=false;
  1421. if tosize<>fromsize then
  1422. begin
  1423. shifterop_reset(so);
  1424. conv_done:=true;
  1425. if tcgsize2size[tosize]<=tcgsize2size[fromsize] then
  1426. fromsize:=tosize;
  1427. if current_settings.cputype<cpu_armv6 then
  1428. case fromsize of
  1429. OS_8:
  1430. if GenerateThumbCode then
  1431. a_op_const_reg_reg(list,OP_AND,OS_32,$ff,reg1,reg2)
  1432. else
  1433. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1434. OS_S8:
  1435. begin
  1436. do_shift(SM_LSL,24,reg1);
  1437. if tosize=OS_16 then
  1438. begin
  1439. do_shift(SM_ASR,8,reg2);
  1440. do_shift(SM_LSR,16,reg2);
  1441. end
  1442. else
  1443. do_shift(SM_ASR,24,reg2);
  1444. end;
  1445. OS_16:
  1446. begin
  1447. do_shift(SM_LSL,16,reg1);
  1448. do_shift(SM_LSR,16,reg2);
  1449. end;
  1450. OS_S16:
  1451. begin
  1452. do_shift(SM_LSL,16,reg1);
  1453. do_shift(SM_ASR,16,reg2)
  1454. end;
  1455. else
  1456. conv_done:=false;
  1457. end
  1458. else
  1459. case fromsize of
  1460. OS_8:
  1461. if GenerateThumbCode then
  1462. list.concat(taicpu.op_reg_reg(A_UXTB,reg2,reg1))
  1463. else
  1464. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1465. OS_S8:
  1466. begin
  1467. if tosize=OS_16 then
  1468. begin
  1469. so.shiftmode:=SM_ROR;
  1470. so.shiftimm:=16;
  1471. list.concat(taicpu.op_reg_reg_shifterop(A_SXTB16,reg2,reg1,so));
  1472. do_shift(SM_LSR,16,reg2);
  1473. end
  1474. else
  1475. list.concat(taicpu.op_reg_reg(A_SXTB,reg2,reg1));
  1476. end;
  1477. OS_16:
  1478. list.concat(taicpu.op_reg_reg(A_UXTH,reg2,reg1));
  1479. OS_S16:
  1480. list.concat(taicpu.op_reg_reg(A_SXTH,reg2,reg1));
  1481. else
  1482. conv_done:=false;
  1483. end
  1484. end;
  1485. if not conv_done and (reg1<>reg2) then
  1486. begin
  1487. { same size, only a register mov required }
  1488. instr:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
  1489. list.Concat(instr);
  1490. { Notify the register allocator that we have written a move instruction so
  1491. it can try to eliminate it. }
  1492. add_move_instruction(instr);
  1493. end;
  1494. end;
  1495. procedure tbasecgarm.a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);
  1496. var
  1497. href,href2 : treference;
  1498. hloc : pcgparalocation;
  1499. begin
  1500. href:=ref;
  1501. hloc:=paraloc.location;
  1502. while assigned(hloc) do
  1503. begin
  1504. case hloc^.loc of
  1505. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  1506. begin
  1507. paramanager.allocparaloc(list,paraloc.location);
  1508. a_loadfpu_ref_reg(list,size,size,ref,hloc^.register);
  1509. end;
  1510. LOC_REGISTER :
  1511. case hloc^.size of
  1512. OS_32,
  1513. OS_F32:
  1514. begin
  1515. paramanager.allocparaloc(list,paraloc.location);
  1516. a_load_ref_reg(list,OS_32,OS_32,href,hloc^.register);
  1517. end;
  1518. OS_64,
  1519. OS_F64:
  1520. cg64.a_load64_ref_cgpara(list,href,paraloc);
  1521. else
  1522. a_load_ref_reg(list,hloc^.size,hloc^.size,href,hloc^.register);
  1523. end;
  1524. LOC_REFERENCE :
  1525. begin
  1526. reference_reset_base(href2,hloc^.reference.index,hloc^.reference.offset,paraloc.alignment);
  1527. { concatcopy should choose the best way to copy the data }
  1528. g_concatcopy(list,href,href2,tcgsize2size[hloc^.size]);
  1529. end;
  1530. else
  1531. internalerror(200408241);
  1532. end;
  1533. inc(href.offset,tcgsize2size[hloc^.size]);
  1534. hloc:=hloc^.next;
  1535. end;
  1536. end;
  1537. procedure tbasecgarm.a_loadfpu_reg_reg(list: TAsmList; fromsize,tosize: tcgsize; reg1, reg2: tregister);
  1538. begin
  1539. list.concat(setoppostfix(taicpu.op_reg_reg(A_MVF,reg2,reg1),cgsize2fpuoppostfix[tosize]));
  1540. end;
  1541. procedure tbasecgarm.a_loadfpu_ref_reg(list: TAsmList; fromsize,tosize: tcgsize; const ref: treference; reg: tregister);
  1542. var
  1543. oppostfix:toppostfix;
  1544. begin
  1545. case fromsize of
  1546. OS_32,
  1547. OS_F32:
  1548. oppostfix:=PF_S;
  1549. OS_64,
  1550. OS_F64:
  1551. oppostfix:=PF_D;
  1552. OS_F80:
  1553. oppostfix:=PF_E;
  1554. else
  1555. InternalError(200309021);
  1556. end;
  1557. handle_load_store(list,A_LDF,oppostfix,reg,ref);
  1558. if fromsize<>tosize then
  1559. a_loadfpu_reg_reg(list,fromsize,tosize,reg,reg);
  1560. end;
  1561. procedure tbasecgarm.a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);
  1562. var
  1563. oppostfix:toppostfix;
  1564. begin
  1565. case tosize of
  1566. OS_F32:
  1567. oppostfix:=PF_S;
  1568. OS_F64:
  1569. oppostfix:=PF_D;
  1570. OS_F80:
  1571. oppostfix:=PF_E;
  1572. else
  1573. InternalError(200309022);
  1574. end;
  1575. handle_load_store(list,A_STF,oppostfix,reg,ref);
  1576. end;
  1577. { comparison operations }
  1578. procedure tbasecgarm.a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  1579. l : tasmlabel);
  1580. var
  1581. tmpreg : tregister;
  1582. b : byte;
  1583. begin
  1584. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1585. if (not(GenerateThumbCode) and is_shifter_const(a,b)) or
  1586. ((GenerateThumbCode) and is_thumb_imm(a)) then
  1587. list.concat(taicpu.op_reg_const(A_CMP,reg,a))
  1588. { CMN reg,0 and CMN reg,$80000000 are different from CMP reg,$ffffffff
  1589. and CMP reg,$7fffffff regarding the flags according to the ARM manual }
  1590. else if (a<>$7fffffff) and (a<>-1) and not(GenerateThumbCode) and is_shifter_const(-a,b) then
  1591. list.concat(taicpu.op_reg_const(A_CMN,reg,-a))
  1592. else
  1593. begin
  1594. tmpreg:=getintregister(list,size);
  1595. a_load_const_reg(list,size,a,tmpreg);
  1596. list.concat(taicpu.op_reg_reg(A_CMP,reg,tmpreg));
  1597. end;
  1598. a_jmp_cond(list,cmp_op,l);
  1599. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1600. end;
  1601. procedure tbasecgarm.a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister);
  1602. begin
  1603. if reverse then
  1604. begin
  1605. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,src));
  1606. list.Concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,31));
  1607. list.Concat(taicpu.op_reg_reg_const(A_AND,dst,dst,255));
  1608. end
  1609. { it is decided during the compilation of the system unit if this code is used or not
  1610. so no additional check for rbit is needed }
  1611. else
  1612. begin
  1613. list.Concat(taicpu.op_reg_reg(A_RBIT,dst,src));
  1614. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,dst));
  1615. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1616. list.Concat(taicpu.op_reg_const(A_CMP,dst,32));
  1617. if GenerateThumb2Code then
  1618. list.Concat(taicpu.op_cond(A_IT, C_EQ));
  1619. list.Concat(setcondition(taicpu.op_reg_const(A_MOV,dst,$ff),C_EQ));
  1620. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1621. end;
  1622. end;
  1623. procedure tbasecgarm.a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel);
  1624. begin
  1625. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1626. list.concat(taicpu.op_reg_reg(A_CMP,reg2,reg1));
  1627. a_jmp_cond(list,cmp_op,l);
  1628. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1629. end;
  1630. procedure tbasecgarm.a_jmp_name(list : TAsmList;const s : string);
  1631. var
  1632. ai : taicpu;
  1633. begin
  1634. { generate far jump, leave it to the optimizer to get rid of it }
  1635. if GenerateThumbCode then
  1636. ai:=taicpu.op_sym(A_BL,current_asmdata.RefAsmSymbol(s))
  1637. else
  1638. ai:=taicpu.op_sym(A_B,current_asmdata.RefAsmSymbol(s));
  1639. ai.is_jmp:=true;
  1640. list.concat(ai);
  1641. end;
  1642. procedure tbasecgarm.a_jmp_always(list : TAsmList;l: tasmlabel);
  1643. var
  1644. ai : taicpu;
  1645. begin
  1646. { generate far jump, leave it to the optimizer to get rid of it }
  1647. if GenerateThumbCode then
  1648. ai:=taicpu.op_sym(A_BL,l)
  1649. else
  1650. ai:=taicpu.op_sym(A_B,l);
  1651. ai.is_jmp:=true;
  1652. list.concat(ai);
  1653. end;
  1654. procedure tbasecgarm.a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel);
  1655. var
  1656. ai : taicpu;
  1657. inv_flags : TResFlags;
  1658. hlabel : TAsmLabel;
  1659. begin
  1660. if GenerateThumbCode then
  1661. begin
  1662. inv_flags:=f;
  1663. inverse_flags(inv_flags);
  1664. { the optimizer has to fix this if jump range is sufficient short }
  1665. current_asmdata.getjumplabel(hlabel);
  1666. ai:=setcondition(taicpu.op_sym(A_B,hlabel),flags_to_cond(inv_flags));
  1667. ai.is_jmp:=true;
  1668. list.concat(ai);
  1669. a_jmp_always(list,l);
  1670. a_label(list,hlabel);
  1671. end
  1672. else
  1673. begin
  1674. ai:=setcondition(taicpu.op_sym(A_B,l),flags_to_cond(f));
  1675. ai.is_jmp:=true;
  1676. list.concat(ai);
  1677. end;
  1678. end;
  1679. procedure tbasecgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  1680. begin
  1681. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  1682. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  1683. end;
  1684. procedure tbasecgarm.g_profilecode(list : TAsmList);
  1685. begin
  1686. if target_info.system = system_arm_linux then
  1687. begin
  1688. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R14]));
  1689. a_call_name(list,'__gnu_mcount_nc',false);
  1690. end
  1691. else
  1692. internalerror(2014091201);
  1693. end;
  1694. procedure tbasecgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  1695. var
  1696. ref : treference;
  1697. shift : byte;
  1698. firstfloatreg,lastfloatreg,
  1699. r : byte;
  1700. mmregs,
  1701. regs, saveregs : tcpuregisterset;
  1702. registerarea,
  1703. r7offset,
  1704. stackmisalignment : pint;
  1705. imm1, imm2: DWord;
  1706. stack_parameters : Boolean;
  1707. begin
  1708. LocalSize:=align(LocalSize,4);
  1709. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  1710. { call instruction does not put anything on the stack }
  1711. registerarea:=0;
  1712. tarmprocinfo(current_procinfo).stackpaddingreg:=High(TSuperRegister);
  1713. lastfloatreg:=RS_NO;
  1714. if not(nostackframe) then
  1715. begin
  1716. firstfloatreg:=RS_NO;
  1717. mmregs:=[];
  1718. case current_settings.fputype of
  1719. fpu_fpa,
  1720. fpu_fpa10,
  1721. fpu_fpa11:
  1722. begin
  1723. { save floating point registers? }
  1724. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1725. for r:=RS_F0 to RS_F7 do
  1726. if r in regs then
  1727. begin
  1728. if firstfloatreg=RS_NO then
  1729. firstfloatreg:=r;
  1730. lastfloatreg:=r;
  1731. inc(registerarea,12);
  1732. end;
  1733. end;
  1734. fpu_vfpv2,
  1735. fpu_vfpv3,
  1736. fpu_vfpv3_d16:
  1737. begin;
  1738. mmregs:=rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall);
  1739. end;
  1740. end;
  1741. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1742. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1743. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  1744. { save int registers }
  1745. reference_reset(ref,4);
  1746. ref.index:=NR_STACK_POINTER_REG;
  1747. ref.addressmode:=AM_PREINDEXED;
  1748. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  1749. if not(target_info.system in systems_darwin) then
  1750. begin
  1751. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1752. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1753. begin
  1754. a_reg_alloc(list,NR_R12);
  1755. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  1756. end;
  1757. { the (old) ARM APCS requires saving both the stack pointer (to
  1758. crawl the stack) and the PC (to identify the function this
  1759. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  1760. and R15 -- still needs updating for EABI and Darwin, they don't
  1761. need that }
  1762. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1763. regs:=regs+[RS_FRAME_POINTER_REG,RS_R12,RS_R14,RS_R15]
  1764. else
  1765. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1766. include(regs,RS_R14);
  1767. if regs<>[] then
  1768. begin
  1769. for r:=RS_R0 to RS_R15 do
  1770. if r in regs then
  1771. inc(registerarea,4);
  1772. { if the stack is not 8 byte aligned, try to add an extra register,
  1773. so we can avoid the extra sub/add ...,#4 later (KB) }
  1774. if ((registerarea mod current_settings.alignment.localalignmax) <> 0) then
  1775. for r:=RS_R3 downto RS_R0 do
  1776. if not(r in regs) then
  1777. begin
  1778. regs:=regs+[r];
  1779. inc(registerarea,4);
  1780. tarmprocinfo(current_procinfo).stackpaddingreg:=r;
  1781. break;
  1782. end;
  1783. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  1784. end;
  1785. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1786. begin
  1787. { the framepointer now points to the saved R15, so the saved
  1788. framepointer is at R11-12 (for get_caller_frame) }
  1789. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  1790. a_reg_dealloc(list,NR_R12);
  1791. end;
  1792. end
  1793. else
  1794. begin
  1795. { always save r14 if we use r7 as the framepointer, because
  1796. the parameter offsets are hardcoded in advance and always
  1797. assume that r14 sits on the stack right behind the saved r7
  1798. }
  1799. if current_procinfo.framepointer=NR_FRAME_POINTER_REG then
  1800. include(regs,RS_FRAME_POINTER_REG);
  1801. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1802. include(regs,RS_R14);
  1803. if regs<>[] then
  1804. begin
  1805. { on Darwin, you first have to save [r4-r7,lr], and then
  1806. [r8,r10,r11] and make r7 point to the previously saved
  1807. r7 so that you can perform a stack crawl based on it
  1808. ([r7] is previous stack frame, [r7+4] is return address
  1809. }
  1810. include(regs,RS_FRAME_POINTER_REG);
  1811. saveregs:=regs-[RS_R8,RS_R10,RS_R11];
  1812. r7offset:=0;
  1813. for r:=RS_R0 to RS_R15 do
  1814. if r in saveregs then
  1815. begin
  1816. inc(registerarea,4);
  1817. if r<RS_FRAME_POINTER_REG then
  1818. inc(r7offset,4);
  1819. end;
  1820. { save the registers }
  1821. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1822. { make r7 point to the saved r7 (regardless of whether this
  1823. frame uses the framepointer, for backtrace purposes) }
  1824. if r7offset<>0 then
  1825. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_FRAME_POINTER_REG,NR_R13,r7offset))
  1826. else
  1827. list.concat(taicpu.op_reg_reg(A_MOV,NR_R7,NR_R13));
  1828. { now save the rest (if any) }
  1829. saveregs:=regs-saveregs;
  1830. if saveregs<>[] then
  1831. begin
  1832. for r:=RS_R8 to RS_R11 do
  1833. if r in saveregs then
  1834. inc(registerarea,4);
  1835. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1836. end;
  1837. end;
  1838. end;
  1839. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  1840. if (LocalSize<>0) or
  1841. ((stackmisalignment<>0) and
  1842. ((pi_do_call in current_procinfo.flags) or
  1843. (po_assembler in current_procinfo.procdef.procoptions))) then
  1844. begin
  1845. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  1846. if stack_parameters and (pi_estimatestacksize in current_procinfo.flags) then
  1847. begin
  1848. if localsize>tarmprocinfo(current_procinfo).stackframesize then
  1849. internalerror(2014030901)
  1850. else
  1851. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea;
  1852. end;
  1853. if is_shifter_const(localsize,shift) then
  1854. begin
  1855. a_reg_dealloc(list,NR_R12);
  1856. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  1857. end
  1858. else if split_into_shifter_const(localsize, imm1, imm2) then
  1859. begin
  1860. a_reg_dealloc(list,NR_R12);
  1861. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  1862. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  1863. end
  1864. else
  1865. begin
  1866. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  1867. a_reg_alloc(list,NR_R12);
  1868. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  1869. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  1870. a_reg_dealloc(list,NR_R12);
  1871. end;
  1872. end;
  1873. if (mmregs<>[]) or
  1874. (firstfloatreg<>RS_NO) then
  1875. begin
  1876. reference_reset(ref,4);
  1877. if (tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023) or
  1878. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv3_d16]) then
  1879. begin
  1880. if not is_shifter_const(tarmprocinfo(current_procinfo).floatregstart,shift) then
  1881. begin
  1882. a_reg_alloc(list,NR_R12);
  1883. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  1884. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1885. a_reg_dealloc(list,NR_R12);
  1886. end
  1887. else
  1888. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tarmprocinfo(current_procinfo).floatregstart));
  1889. ref.base:=NR_R12;
  1890. end
  1891. else
  1892. begin
  1893. ref.base:=current_procinfo.framepointer;
  1894. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  1895. end;
  1896. case current_settings.fputype of
  1897. fpu_fpa,
  1898. fpu_fpa10,
  1899. fpu_fpa11:
  1900. begin
  1901. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  1902. lastfloatreg-firstfloatreg+1,ref));
  1903. end;
  1904. fpu_vfpv2,
  1905. fpu_vfpv3,
  1906. fpu_vfpv3_d16:
  1907. begin
  1908. ref.index:=ref.base;
  1909. ref.base:=NR_NO;
  1910. { FSTMX is deprecated on ARMv6 and later }
  1911. {if (current_settings.cputype<cpu_armv6) then
  1912. postfix:=PF_IAX
  1913. else
  1914. postfix:=PF_IAD;}
  1915. list.concat(taicpu.op_ref_regset(A_VSTM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  1916. end;
  1917. end;
  1918. end;
  1919. end;
  1920. end;
  1921. procedure tbasecgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  1922. var
  1923. ref : treference;
  1924. LocalSize : longint;
  1925. firstfloatreg,lastfloatreg,
  1926. r,
  1927. shift : byte;
  1928. mmregs,
  1929. saveregs,
  1930. regs : tcpuregisterset;
  1931. registerarea,
  1932. stackmisalignment: pint;
  1933. paddingreg: TSuperRegister;
  1934. imm1, imm2: DWord;
  1935. begin
  1936. if not(nostackframe) then
  1937. begin
  1938. registerarea:=0;
  1939. firstfloatreg:=RS_NO;
  1940. lastfloatreg:=RS_NO;
  1941. mmregs:=[];
  1942. saveregs:=[];
  1943. case current_settings.fputype of
  1944. fpu_fpa,
  1945. fpu_fpa10,
  1946. fpu_fpa11:
  1947. begin
  1948. { restore floating point registers? }
  1949. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1950. for r:=RS_F0 to RS_F7 do
  1951. if r in regs then
  1952. begin
  1953. if firstfloatreg=RS_NO then
  1954. firstfloatreg:=r;
  1955. lastfloatreg:=r;
  1956. { floating point register space is already included in
  1957. localsize below by calc_stackframe_size
  1958. inc(registerarea,12);
  1959. }
  1960. end;
  1961. end;
  1962. fpu_vfpv2,
  1963. fpu_vfpv3,
  1964. fpu_vfpv3_d16:
  1965. begin;
  1966. { restore vfp registers? }
  1967. mmregs:=rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall);
  1968. end;
  1969. end;
  1970. if (firstfloatreg<>RS_NO) or
  1971. (mmregs<>[]) then
  1972. begin
  1973. reference_reset(ref,4);
  1974. if (tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023) or
  1975. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv3_d16]) then
  1976. begin
  1977. if not is_shifter_const(tarmprocinfo(current_procinfo).floatregstart,shift) then
  1978. begin
  1979. a_reg_alloc(list,NR_R12);
  1980. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  1981. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1982. a_reg_dealloc(list,NR_R12);
  1983. end
  1984. else
  1985. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tarmprocinfo(current_procinfo).floatregstart));
  1986. ref.base:=NR_R12;
  1987. end
  1988. else
  1989. begin
  1990. ref.base:=current_procinfo.framepointer;
  1991. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  1992. end;
  1993. case current_settings.fputype of
  1994. fpu_fpa,
  1995. fpu_fpa10,
  1996. fpu_fpa11:
  1997. begin
  1998. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  1999. lastfloatreg-firstfloatreg+1,ref));
  2000. end;
  2001. fpu_vfpv2,
  2002. fpu_vfpv3,
  2003. fpu_vfpv3_d16:
  2004. begin
  2005. ref.index:=ref.base;
  2006. ref.base:=NR_NO;
  2007. { FLDMX is deprecated on ARMv6 and later }
  2008. {if (current_settings.cputype<cpu_armv6) then
  2009. mmpostfix:=PF_IAX
  2010. else
  2011. mmpostfix:=PF_IAD;}
  2012. list.concat(taicpu.op_ref_regset(A_VLDM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  2013. end;
  2014. end;
  2015. end;
  2016. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  2017. if (pi_do_call in current_procinfo.flags) or
  2018. (regs<>[]) or
  2019. ((target_info.system in systems_darwin) and
  2020. (current_procinfo.framepointer<>NR_STACK_POINTER_REG)) then
  2021. begin
  2022. exclude(regs,RS_R14);
  2023. include(regs,RS_R15);
  2024. if (target_info.system in systems_darwin) then
  2025. include(regs,RS_FRAME_POINTER_REG);
  2026. end;
  2027. if not(target_info.system in systems_darwin) then
  2028. begin
  2029. { restore saved stack pointer to SP (R13) and saved lr to PC (R15).
  2030. The saved PC came after that but is discarded, since we restore
  2031. the stack pointer }
  2032. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  2033. regs:=regs+[RS_FRAME_POINTER_REG,RS_R13,RS_R15];
  2034. end
  2035. else
  2036. begin
  2037. { restore R8-R11 already if necessary (they've been stored
  2038. before the others) }
  2039. saveregs:=regs*[RS_R8,RS_R10,RS_R11];
  2040. if saveregs<>[] then
  2041. begin
  2042. reference_reset(ref,4);
  2043. ref.index:=NR_STACK_POINTER_REG;
  2044. ref.addressmode:=AM_PREINDEXED;
  2045. for r:=RS_R8 to RS_R11 do
  2046. if r in saveregs then
  2047. inc(registerarea,4);
  2048. regs:=regs-saveregs;
  2049. end;
  2050. end;
  2051. for r:=RS_R0 to RS_R15 do
  2052. if r in regs then
  2053. inc(registerarea,4);
  2054. { reapply the stack padding reg, in case there was one, see the complimentary
  2055. comment in g_proc_entry() (KB) }
  2056. paddingreg:=tarmprocinfo(current_procinfo).stackpaddingreg;
  2057. if paddingreg < RS_R4 then
  2058. if paddingreg in regs then
  2059. internalerror(201306190)
  2060. else
  2061. begin
  2062. regs:=regs+[paddingreg];
  2063. inc(registerarea,4);
  2064. end;
  2065. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  2066. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  2067. (target_info.system in systems_darwin) then
  2068. begin
  2069. LocalSize:=current_procinfo.calc_stackframe_size;
  2070. if (LocalSize<>0) or
  2071. ((stackmisalignment<>0) and
  2072. ((pi_do_call in current_procinfo.flags) or
  2073. (po_assembler in current_procinfo.procdef.procoptions))) then
  2074. begin
  2075. if pi_estimatestacksize in current_procinfo.flags then
  2076. LocalSize:=tarmprocinfo(current_procinfo).stackframesize-registerarea
  2077. else
  2078. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  2079. if is_shifter_const(LocalSize,shift) then
  2080. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  2081. else if split_into_shifter_const(localsize, imm1, imm2) then
  2082. begin
  2083. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  2084. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  2085. end
  2086. else
  2087. begin
  2088. a_reg_alloc(list,NR_R12);
  2089. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  2090. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  2091. a_reg_dealloc(list,NR_R12);
  2092. end;
  2093. end;
  2094. if (target_info.system in systems_darwin) and
  2095. (saveregs<>[]) then
  2096. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  2097. if regs=[] then
  2098. begin
  2099. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2100. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2101. else
  2102. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2103. end
  2104. else
  2105. begin
  2106. reference_reset(ref,4);
  2107. ref.index:=NR_STACK_POINTER_REG;
  2108. ref.addressmode:=AM_PREINDEXED;
  2109. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  2110. end;
  2111. end
  2112. else
  2113. begin
  2114. { restore int registers and return }
  2115. reference_reset(ref,4);
  2116. ref.index:=NR_FRAME_POINTER_REG;
  2117. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_EA));
  2118. end;
  2119. end
  2120. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2121. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2122. else
  2123. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2124. end;
  2125. procedure tbasecgarm.g_maybe_got_init(list : TAsmList);
  2126. var
  2127. ref : treference;
  2128. l : TAsmLabel;
  2129. regs : tcpuregisterset;
  2130. r: byte;
  2131. begin
  2132. if (cs_create_pic in current_settings.moduleswitches) and
  2133. (pi_needs_got in current_procinfo.flags) and
  2134. (tf_pic_uses_got in target_info.flags) then
  2135. begin
  2136. { Procedure parametrs are not initialized at this stage.
  2137. Before GOT initialization code, allocate registers used for procedure parameters
  2138. to prevent usage of these registers for temp operations in later stages of code
  2139. generation. }
  2140. regs:=rg[R_INTREGISTER].used_in_proc;
  2141. for r:=RS_R0 to RS_R3 do
  2142. if r in regs then
  2143. a_reg_alloc(list, newreg(R_INTREGISTER,r,R_SUBWHOLE));
  2144. { Allocate scratch register R12 and use it for GOT calculations directly.
  2145. Otherwise the init code can be distorted in later stages of code generation. }
  2146. a_reg_alloc(list,NR_R12);
  2147. reference_reset(ref,4);
  2148. current_asmdata.getglobaldatalabel(l);
  2149. cg.a_label(current_procinfo.aktlocaldata,l);
  2150. ref.symbol:=l;
  2151. ref.base:=NR_PC;
  2152. ref.symboldata:=current_procinfo.aktlocaldata.last;
  2153. list.concat(Taicpu.op_reg_ref(A_LDR,NR_R12,ref));
  2154. current_asmdata.getaddrlabel(l);
  2155. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_32bit,l,current_asmdata.RefAsmSymbol('_GLOBAL_OFFSET_TABLE_'),-8));
  2156. cg.a_label(list,l);
  2157. list.concat(Taicpu.op_reg_reg_reg(A_ADD,NR_R12,NR_PC,NR_R12));
  2158. list.concat(Taicpu.op_reg_reg(A_MOV,current_procinfo.got,NR_R12));
  2159. { Deallocate registers }
  2160. a_reg_dealloc(list,NR_R12);
  2161. for r:=RS_R3 downto RS_R0 do
  2162. if r in regs then
  2163. a_reg_dealloc(list, newreg(R_INTREGISTER,r,R_SUBWHOLE));
  2164. end;
  2165. end;
  2166. procedure tbasecgarm.a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);
  2167. var
  2168. b : byte;
  2169. tmpref : treference;
  2170. instr : taicpu;
  2171. begin
  2172. if ref.addressmode<>AM_OFFSET then
  2173. internalerror(200309071);
  2174. tmpref:=ref;
  2175. { Be sure to have a base register }
  2176. if (tmpref.base=NR_NO) then
  2177. begin
  2178. if tmpref.shiftmode<>SM_None then
  2179. internalerror(2014020702);
  2180. if tmpref.signindex<0 then
  2181. internalerror(200312023);
  2182. tmpref.base:=tmpref.index;
  2183. tmpref.index:=NR_NO;
  2184. end;
  2185. if assigned(tmpref.symbol) or
  2186. not((is_shifter_const(tmpref.offset,b)) or
  2187. (is_shifter_const(-tmpref.offset,b))
  2188. ) then
  2189. fixref(list,tmpref);
  2190. { expect a base here if there is an index }
  2191. if (tmpref.base=NR_NO) and (tmpref.index<>NR_NO) then
  2192. internalerror(200312022);
  2193. if tmpref.index<>NR_NO then
  2194. begin
  2195. if tmpref.shiftmode<>SM_None then
  2196. internalerror(200312021);
  2197. if tmpref.signindex<0 then
  2198. a_op_reg_reg_reg(list,OP_SUB,OS_ADDR,tmpref.base,tmpref.index,r)
  2199. else
  2200. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpref.base,tmpref.index,r);
  2201. if tmpref.offset<>0 then
  2202. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,r,r);
  2203. end
  2204. else
  2205. begin
  2206. if tmpref.base=NR_NO then
  2207. a_load_const_reg(list,OS_ADDR,tmpref.offset,r)
  2208. else
  2209. if tmpref.offset<>0 then
  2210. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,tmpref.base,r)
  2211. else
  2212. begin
  2213. instr:=taicpu.op_reg_reg(A_MOV,r,tmpref.base);
  2214. list.concat(instr);
  2215. add_move_instruction(instr);
  2216. end;
  2217. end;
  2218. end;
  2219. procedure tbasecgarm.fixref(list : TAsmList;var ref : treference);
  2220. var
  2221. tmpreg, tmpreg2 : tregister;
  2222. tmpref : treference;
  2223. l, piclabel : tasmlabel;
  2224. indirection_done : boolean;
  2225. begin
  2226. { absolute symbols can't be handled directly, we've to store the symbol reference
  2227. in the text segment and access it pc relative
  2228. For now, we assume that references where base or index equals to PC are already
  2229. relative, all other references are assumed to be absolute and thus they need
  2230. to be handled extra.
  2231. A proper solution would be to change refoptions to a set and store the information
  2232. if the symbol is absolute or relative there.
  2233. }
  2234. { create consts entry }
  2235. reference_reset(tmpref,4);
  2236. current_asmdata.getjumplabel(l);
  2237. cg.a_label(current_procinfo.aktlocaldata,l);
  2238. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  2239. piclabel:=nil;
  2240. tmpreg:=NR_NO;
  2241. indirection_done:=false;
  2242. if assigned(ref.symbol) then
  2243. begin
  2244. if (target_info.system=system_arm_darwin) and
  2245. (ref.symbol.bind in [AB_EXTERNAL,AB_WEAK_EXTERNAL,AB_PRIVATE_EXTERN,AB_COMMON]) then
  2246. begin
  2247. tmpreg:=g_indirect_sym_load(list,ref.symbol.name,asmsym2indsymflags(ref.symbol));
  2248. if ref.offset<>0 then
  2249. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2250. indirection_done:=true;
  2251. end
  2252. else if (cs_create_pic in current_settings.moduleswitches) then
  2253. if (tf_pic_uses_got in target_info.flags) then
  2254. current_procinfo.aktlocaldata.concat(tai_const.Create_type_sym(aitconst_got,ref.symbol))
  2255. else
  2256. begin
  2257. { ideally, we would want to generate
  2258. ldr r1, LPICConstPool
  2259. LPICLocal:
  2260. ldr/str r2,[pc,r1]
  2261. ...
  2262. LPICConstPool:
  2263. .long _globsym-(LPICLocal+8)
  2264. However, we cannot be sure that the ldr/str will follow
  2265. right after the call to fixref, so we have to load the
  2266. complete address already in a register.
  2267. }
  2268. current_asmdata.getaddrlabel(piclabel);
  2269. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_ptr,piclabel,ref.symbol,ref.offset-8));
  2270. end
  2271. else
  2272. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset))
  2273. end
  2274. else
  2275. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ref.offset));
  2276. { load consts entry }
  2277. if not indirection_done then
  2278. begin
  2279. tmpreg:=getintregister(list,OS_INT);
  2280. tmpref.symbol:=l;
  2281. tmpref.base:=NR_PC;
  2282. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2283. if (cs_create_pic in current_settings.moduleswitches) and
  2284. (tf_pic_uses_got in target_info.flags) and
  2285. assigned(ref.symbol) then
  2286. begin
  2287. reference_reset(tmpref,4);
  2288. tmpref.base:=current_procinfo.got;
  2289. tmpref.index:=tmpreg;
  2290. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2291. if ref.offset<>0 then
  2292. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2293. end;
  2294. end;
  2295. if assigned(piclabel) then
  2296. begin
  2297. cg.a_label(list,piclabel);
  2298. tmpreg2:=getaddressregister(list);
  2299. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpreg,NR_PC,tmpreg2);
  2300. tmpreg:=tmpreg2
  2301. end;
  2302. { This routine can be called with PC as base/index in case the offset
  2303. was too large to encode in a load/store. In that case, the entire
  2304. absolute expression has been re-encoded in a new constpool entry, and
  2305. we have to remove the use of PC from the original reference (the code
  2306. above made everything relative to the value loaded from the new
  2307. constpool entry) }
  2308. if is_pc(ref.base) then
  2309. ref.base:=NR_NO;
  2310. if is_pc(ref.index) then
  2311. ref.index:=NR_NO;
  2312. if (ref.base<>NR_NO) then
  2313. begin
  2314. if ref.index<>NR_NO then
  2315. begin
  2316. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  2317. ref.base:=tmpreg;
  2318. end
  2319. else
  2320. if ref.base<>NR_PC then
  2321. begin
  2322. ref.index:=tmpreg;
  2323. ref.shiftimm:=0;
  2324. ref.signindex:=1;
  2325. ref.shiftmode:=SM_None;
  2326. end
  2327. else
  2328. ref.base:=tmpreg;
  2329. end
  2330. else
  2331. ref.base:=tmpreg;
  2332. ref.offset:=0;
  2333. ref.symbol:=nil;
  2334. end;
  2335. procedure tbasecgarm.g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  2336. var
  2337. paraloc1,paraloc2,paraloc3 : TCGPara;
  2338. pd : tprocdef;
  2339. begin
  2340. pd:=search_system_proc('MOVE');
  2341. paraloc1.init;
  2342. paraloc2.init;
  2343. paraloc3.init;
  2344. paramanager.getintparaloc(list,pd,1,paraloc1);
  2345. paramanager.getintparaloc(list,pd,2,paraloc2);
  2346. paramanager.getintparaloc(list,pd,3,paraloc3);
  2347. a_load_const_cgpara(list,OS_SINT,len,paraloc3);
  2348. a_loadaddr_ref_cgpara(list,dest,paraloc2);
  2349. a_loadaddr_ref_cgpara(list,source,paraloc1);
  2350. paramanager.freecgpara(list,paraloc3);
  2351. paramanager.freecgpara(list,paraloc2);
  2352. paramanager.freecgpara(list,paraloc1);
  2353. alloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2354. alloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2355. a_call_name(list,'FPC_MOVE',false);
  2356. dealloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2357. dealloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2358. paraloc3.done;
  2359. paraloc2.done;
  2360. paraloc1.done;
  2361. end;
  2362. procedure tbasecgarm.g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  2363. const
  2364. maxtmpreg_arm = 10; {roozbeh: can be reduced to 8 or lower if might conflick with reserved ones,also +2 is used becouse of regs required for referencing}
  2365. maxtmpreg_thumb = 5;
  2366. var
  2367. srcref,dstref,usedtmpref,usedtmpref2:treference;
  2368. srcreg,destreg,countreg,r,tmpreg:tregister;
  2369. helpsize:aint;
  2370. copysize:byte;
  2371. cgsize:Tcgsize;
  2372. tmpregisters:array[1..maxtmpreg_arm] of tregister;
  2373. maxtmpreg,
  2374. tmpregi,tmpregi2:byte;
  2375. { will never be called with count<=4 }
  2376. procedure genloop(count : aword;size : byte);
  2377. const
  2378. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2379. var
  2380. l : tasmlabel;
  2381. begin
  2382. current_asmdata.getjumplabel(l);
  2383. if count<size then size:=1;
  2384. a_load_const_reg(list,OS_INT,count div size,countreg);
  2385. cg.a_label(list,l);
  2386. srcref.addressmode:=AM_POSTINDEXED;
  2387. dstref.addressmode:=AM_POSTINDEXED;
  2388. srcref.offset:=size;
  2389. dstref.offset:=size;
  2390. r:=getintregister(list,size2opsize[size]);
  2391. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2392. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2393. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1),PF_S));
  2394. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2395. a_jmp_flags(list,F_NE,l);
  2396. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2397. srcref.offset:=1;
  2398. dstref.offset:=1;
  2399. case count mod size of
  2400. 1:
  2401. begin
  2402. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2403. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2404. end;
  2405. 2:
  2406. if aligned then
  2407. begin
  2408. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2409. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2410. end
  2411. else
  2412. begin
  2413. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2414. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2415. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2416. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2417. end;
  2418. 3:
  2419. if aligned then
  2420. begin
  2421. srcref.offset:=2;
  2422. dstref.offset:=2;
  2423. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2424. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2425. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2426. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2427. end
  2428. else
  2429. begin
  2430. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2431. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2432. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2433. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2434. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2435. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2436. end;
  2437. end;
  2438. { keep the registers alive }
  2439. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2440. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2441. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2442. end;
  2443. { will never be called with count<=4 }
  2444. procedure genloop_thumb(count : aword;size : byte);
  2445. procedure refincofs(const ref : treference;const value : longint = 1);
  2446. begin
  2447. a_op_const_reg(list,OP_ADD,OS_ADDR,value,ref.base);
  2448. end;
  2449. const
  2450. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2451. var
  2452. l : tasmlabel;
  2453. begin
  2454. current_asmdata.getjumplabel(l);
  2455. if count<size then size:=1;
  2456. a_load_const_reg(list,OS_INT,count div size,countreg);
  2457. cg.a_label(list,l);
  2458. r:=getintregister(list,size2opsize[size]);
  2459. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2460. refincofs(srcref);
  2461. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2462. refincofs(dstref);
  2463. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2464. list.concat(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1));
  2465. a_jmp_flags(list,F_NE,l);
  2466. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2467. case count mod size of
  2468. 1:
  2469. begin
  2470. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2471. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2472. end;
  2473. 2:
  2474. if aligned then
  2475. begin
  2476. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2477. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2478. end
  2479. else
  2480. begin
  2481. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2482. refincofs(srcref);
  2483. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2484. refincofs(dstref);
  2485. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2486. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2487. end;
  2488. 3:
  2489. if aligned then
  2490. begin
  2491. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2492. refincofs(srcref,2);
  2493. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2494. refincofs(dstref,2);
  2495. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2496. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2497. end
  2498. else
  2499. begin
  2500. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2501. refincofs(srcref);
  2502. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2503. refincofs(dstref);
  2504. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2505. refincofs(srcref);
  2506. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2507. refincofs(dstref);
  2508. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2509. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2510. end;
  2511. end;
  2512. { keep the registers alive }
  2513. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2514. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2515. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2516. end;
  2517. begin
  2518. if len=0 then
  2519. exit;
  2520. if GenerateThumbCode then
  2521. maxtmpreg:=maxtmpreg_thumb
  2522. else
  2523. maxtmpreg:=maxtmpreg_arm;
  2524. helpsize:=12+maxtmpreg*4;//52 with maxtmpreg=10
  2525. dstref:=dest;
  2526. srcref:=source;
  2527. if cs_opt_size in current_settings.optimizerswitches then
  2528. helpsize:=8;
  2529. if aligned and (len=4) then
  2530. begin
  2531. tmpreg:=getintregister(list,OS_32);
  2532. a_load_ref_reg(list,OS_32,OS_32,source,tmpreg);
  2533. a_load_reg_ref(list,OS_32,OS_32,tmpreg,dest);
  2534. end
  2535. else if aligned and (len=2) then
  2536. begin
  2537. tmpreg:=getintregister(list,OS_16);
  2538. a_load_ref_reg(list,OS_16,OS_16,source,tmpreg);
  2539. a_load_reg_ref(list,OS_16,OS_16,tmpreg,dest);
  2540. end
  2541. else if (len<=helpsize) and aligned then
  2542. begin
  2543. tmpregi:=0;
  2544. srcreg:=getintregister(list,OS_ADDR);
  2545. { explicit pc relative addressing, could be
  2546. e.g. a floating point constant }
  2547. if source.base=NR_PC then
  2548. begin
  2549. { ... then we don't need a loadaddr }
  2550. srcref:=source;
  2551. end
  2552. else
  2553. begin
  2554. a_loadaddr_ref_reg(list,source,srcreg);
  2555. reference_reset_base(srcref,srcreg,0,source.alignment);
  2556. end;
  2557. while (len div 4 <> 0) and (tmpregi<maxtmpreg) do
  2558. begin
  2559. inc(tmpregi);
  2560. tmpregisters[tmpregi]:=getintregister(list,OS_32);
  2561. a_load_ref_reg(list,OS_32,OS_32,srcref,tmpregisters[tmpregi]);
  2562. inc(srcref.offset,4);
  2563. dec(len,4);
  2564. end;
  2565. destreg:=getintregister(list,OS_ADDR);
  2566. a_loadaddr_ref_reg(list,dest,destreg);
  2567. reference_reset_base(dstref,destreg,0,dest.alignment);
  2568. tmpregi2:=1;
  2569. while (tmpregi2<=tmpregi) do
  2570. begin
  2571. a_load_reg_ref(list,OS_32,OS_32,tmpregisters[tmpregi2],dstref);
  2572. inc(dstref.offset,4);
  2573. inc(tmpregi2);
  2574. end;
  2575. copysize:=4;
  2576. cgsize:=OS_32;
  2577. while len<>0 do
  2578. begin
  2579. if len<2 then
  2580. begin
  2581. copysize:=1;
  2582. cgsize:=OS_8;
  2583. end
  2584. else if len<4 then
  2585. begin
  2586. copysize:=2;
  2587. cgsize:=OS_16;
  2588. end;
  2589. dec(len,copysize);
  2590. r:=getintregister(list,cgsize);
  2591. a_load_ref_reg(list,cgsize,cgsize,srcref,r);
  2592. a_load_reg_ref(list,cgsize,cgsize,r,dstref);
  2593. inc(srcref.offset,copysize);
  2594. inc(dstref.offset,copysize);
  2595. end;{end of while}
  2596. end
  2597. else
  2598. begin
  2599. cgsize:=OS_32;
  2600. if (len<=4) then{len<=4 and not aligned}
  2601. begin
  2602. r:=getintregister(list,cgsize);
  2603. usedtmpref:=a_internal_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2604. if Len=1 then
  2605. a_load_reg_ref(list,OS_8,OS_8,r,dstref)
  2606. else
  2607. begin
  2608. tmpreg:=getintregister(list,cgsize);
  2609. usedtmpref2:=a_internal_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2610. inc(usedtmpref.offset,1);
  2611. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2612. inc(usedtmpref2.offset,1);
  2613. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2614. if len>2 then
  2615. begin
  2616. inc(usedtmpref.offset,1);
  2617. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2618. inc(usedtmpref2.offset,1);
  2619. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2620. if len>3 then
  2621. begin
  2622. inc(usedtmpref.offset,1);
  2623. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2624. inc(usedtmpref2.offset,1);
  2625. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2626. end;
  2627. end;
  2628. end;
  2629. end{end of if len<=4}
  2630. else
  2631. begin{unaligned & 4<len<helpsize **or** aligned/unaligned & len>helpsize}
  2632. destreg:=getintregister(list,OS_ADDR);
  2633. a_loadaddr_ref_reg(list,dest,destreg);
  2634. reference_reset_base(dstref,destreg,0,dest.alignment);
  2635. srcreg:=getintregister(list,OS_ADDR);
  2636. a_loadaddr_ref_reg(list,source,srcreg);
  2637. reference_reset_base(srcref,srcreg,0,source.alignment);
  2638. countreg:=getintregister(list,OS_32);
  2639. // if cs_opt_size in current_settings.optimizerswitches then
  2640. { roozbeh : it seems loading 1 byte is faster becouse of caching/fetching(?) }
  2641. {if aligned then
  2642. genloop(len,4)
  2643. else}
  2644. if GenerateThumbCode then
  2645. genloop_thumb(len,1)
  2646. else
  2647. genloop(len,1);
  2648. end;
  2649. end;
  2650. end;
  2651. procedure tbasecgarm.g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);
  2652. begin
  2653. g_concatcopy_internal(list,source,dest,len,false);
  2654. end;
  2655. procedure tbasecgarm.g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);
  2656. begin
  2657. if (source.alignment in [1,3]) or
  2658. (dest.alignment in [1,3]) then
  2659. g_concatcopy_internal(list,source,dest,len,false)
  2660. else
  2661. g_concatcopy_internal(list,source,dest,len,true);
  2662. end;
  2663. procedure tbasecgarm.g_overflowCheck(list : TAsmList;const l : tlocation;def : tdef);
  2664. var
  2665. ovloc : tlocation;
  2666. begin
  2667. ovloc.loc:=LOC_VOID;
  2668. g_overflowCheck_loc(list,l,def,ovloc);
  2669. end;
  2670. procedure tbasecgarm.g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);
  2671. var
  2672. hl : tasmlabel;
  2673. ai:TAiCpu;
  2674. hflags : tresflags;
  2675. begin
  2676. if not(cs_check_overflow in current_settings.localswitches) then
  2677. exit;
  2678. current_asmdata.getjumplabel(hl);
  2679. case ovloc.loc of
  2680. LOC_VOID:
  2681. begin
  2682. ai:=taicpu.op_sym(A_B,hl);
  2683. ai.is_jmp:=true;
  2684. if not((def.typ=pointerdef) or
  2685. ((def.typ=orddef) and
  2686. (torddef(def).ordtype in [u64bit,u16bit,u32bit,u8bit,uchar,
  2687. pasbool8,pasbool16,pasbool32,pasbool64]))) then
  2688. ai.SetCondition(C_VC)
  2689. else
  2690. if TAiCpu(List.Last).opcode in [A_RSB,A_RSC,A_SBC,A_SUB] then
  2691. ai.SetCondition(C_CS)
  2692. else
  2693. ai.SetCondition(C_CC);
  2694. list.concat(ai);
  2695. end;
  2696. LOC_FLAGS:
  2697. begin
  2698. hflags:=ovloc.resflags;
  2699. inverse_flags(hflags);
  2700. cg.a_jmp_flags(list,hflags,hl);
  2701. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2702. end;
  2703. else
  2704. internalerror(200409281);
  2705. end;
  2706. a_call_name(list,'FPC_OVERFLOW',false);
  2707. a_label(list,hl);
  2708. end;
  2709. procedure tbasecgarm.g_save_registers(list : TAsmList);
  2710. begin
  2711. { this work is done in g_proc_entry }
  2712. end;
  2713. procedure tbasecgarm.g_restore_registers(list : TAsmList);
  2714. begin
  2715. { this work is done in g_proc_exit }
  2716. end;
  2717. procedure tbasecgarm.a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  2718. var
  2719. ai : taicpu;
  2720. hlabel : TAsmLabel;
  2721. begin
  2722. if GenerateThumbCode then
  2723. begin
  2724. { the optimizer has to fix this if jump range is sufficient short }
  2725. current_asmdata.getjumplabel(hlabel);
  2726. ai:=Taicpu.Op_sym(A_B,hlabel);
  2727. ai.SetCondition(inverse_cond(OpCmp2AsmCond[cond]));
  2728. ai.is_jmp:=true;
  2729. list.concat(ai);
  2730. a_jmp_always(list,l);
  2731. a_label(list,hlabel);
  2732. end
  2733. else
  2734. begin
  2735. ai:=Taicpu.Op_sym(A_B,l);
  2736. ai.SetCondition(OpCmp2AsmCond[cond]);
  2737. ai.is_jmp:=true;
  2738. list.concat(ai);
  2739. end;
  2740. end;
  2741. function get_scalar_mm_op(fromsize,tosize : tcgsize) : tasmop;
  2742. const
  2743. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of tasmop = (
  2744. (A_VMOV,A_VCVT,A_NONE,A_NONE,A_NONE),
  2745. (A_VCVT,A_VMOV,A_NONE,A_NONE,A_NONE),
  2746. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2747. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2748. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE));
  2749. begin
  2750. result:=convertop[fromsize,tosize];
  2751. if result=A_NONE then
  2752. internalerror(200312205);
  2753. end;
  2754. function get_scalar_mm_prefix(fromsize,tosize : tcgsize) : TOpPostfix;
  2755. const
  2756. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of TOpPostfix = (
  2757. (PF_F32, PF_F32F64,PF_None,PF_None,PF_None),
  2758. (PF_F64F32,PF_F64, PF_None,PF_None,PF_None),
  2759. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2760. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2761. (PF_None, PF_None, PF_None,PF_None,PF_None));
  2762. begin
  2763. result:=convertop[fromsize,tosize];
  2764. end;
  2765. procedure tbasecgarm.a_loadmm_reg_reg(list: tasmlist; fromsize,tosize: tcgsize; reg1,reg2: tregister; shuffle: pmmshuffle);
  2766. var
  2767. instr: taicpu;
  2768. begin
  2769. if (shuffle=nil) or shufflescalar(shuffle) then
  2770. instr:=setoppostfix(taicpu.op_reg_reg(get_scalar_mm_op(tosize,fromsize),reg2,reg1),get_scalar_mm_prefix(tosize,fromsize))
  2771. else
  2772. internalerror(2009112407);
  2773. list.concat(instr);
  2774. case instr.opcode of
  2775. A_VMOV:
  2776. add_move_instruction(instr);
  2777. end;
  2778. end;
  2779. procedure tbasecgarm.a_loadmm_ref_reg(list: tasmlist; fromsize,tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  2780. var
  2781. intreg,
  2782. tmpmmreg : tregister;
  2783. reg64 : tregister64;
  2784. begin
  2785. if assigned(shuffle) and
  2786. not(shufflescalar(shuffle)) then
  2787. internalerror(2009112413);
  2788. case fromsize of
  2789. OS_32,OS_S32:
  2790. begin
  2791. fromsize:=OS_F32;
  2792. { since we are loading an integer, no conversion may be required }
  2793. if (fromsize<>tosize) then
  2794. internalerror(2009112801);
  2795. end;
  2796. OS_64,OS_S64:
  2797. begin
  2798. fromsize:=OS_F64;
  2799. { since we are loading an integer, no conversion may be required }
  2800. if (fromsize<>tosize) then
  2801. internalerror(2009112901);
  2802. end;
  2803. end;
  2804. if (fromsize<>tosize) then
  2805. tmpmmreg:=getmmregister(list,fromsize)
  2806. else
  2807. tmpmmreg:=reg;
  2808. if (ref.alignment in [1,2]) then
  2809. begin
  2810. case fromsize of
  2811. OS_F32:
  2812. begin
  2813. intreg:=getintregister(list,OS_32);
  2814. a_load_ref_reg(list,OS_32,OS_32,ref,intreg);
  2815. a_loadmm_intreg_reg(list,OS_32,OS_F32,intreg,tmpmmreg,mms_movescalar);
  2816. end;
  2817. OS_F64:
  2818. begin
  2819. reg64.reglo:=getintregister(list,OS_32);
  2820. reg64.reghi:=getintregister(list,OS_32);
  2821. cg64.a_load64_ref_reg(list,ref,reg64);
  2822. cg64.a_loadmm_intreg64_reg(list,OS_F64,reg64,tmpmmreg);
  2823. end;
  2824. else
  2825. internalerror(2009112412);
  2826. end;
  2827. end
  2828. else
  2829. begin
  2830. handle_load_store(list,A_VLDR,PF_None,tmpmmreg,ref);
  2831. end;
  2832. if (tmpmmreg<>reg) then
  2833. a_loadmm_reg_reg(list,fromsize,tosize,tmpmmreg,reg,shuffle);
  2834. end;
  2835. procedure tbasecgarm.a_loadmm_reg_ref(list: tasmlist; fromsize,tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  2836. var
  2837. intreg,
  2838. tmpmmreg : tregister;
  2839. reg64 : tregister64;
  2840. begin
  2841. if assigned(shuffle) and
  2842. not(shufflescalar(shuffle)) then
  2843. internalerror(2009112416);
  2844. case tosize of
  2845. OS_32,OS_S32:
  2846. begin
  2847. tosize:=OS_F32;
  2848. { since we are loading an integer, no conversion may be required }
  2849. if (fromsize<>tosize) then
  2850. internalerror(2009112801);
  2851. end;
  2852. OS_64,OS_S64:
  2853. begin
  2854. tosize:=OS_F64;
  2855. { since we are loading an integer, no conversion may be required }
  2856. if (fromsize<>tosize) then
  2857. internalerror(2009112901);
  2858. end;
  2859. end;
  2860. if (fromsize<>tosize) then
  2861. begin
  2862. tmpmmreg:=getmmregister(list,tosize);
  2863. a_loadmm_reg_reg(list,fromsize,tosize,reg,tmpmmreg,shuffle);
  2864. end
  2865. else
  2866. tmpmmreg:=reg;
  2867. if (ref.alignment in [1,2]) then
  2868. begin
  2869. case tosize of
  2870. OS_F32:
  2871. begin
  2872. intreg:=getintregister(list,OS_32);
  2873. a_loadmm_reg_intreg(list,OS_F32,OS_32,tmpmmreg,intreg,shuffle);
  2874. a_load_reg_ref(list,OS_32,OS_32,intreg,ref);
  2875. end;
  2876. OS_F64:
  2877. begin
  2878. reg64.reglo:=getintregister(list,OS_32);
  2879. reg64.reghi:=getintregister(list,OS_32);
  2880. cg64.a_loadmm_reg_intreg64(list,OS_F64,tmpmmreg,reg64);
  2881. cg64.a_load64_reg_ref(list,reg64,ref);
  2882. end;
  2883. else
  2884. internalerror(2009112417);
  2885. end;
  2886. end
  2887. else
  2888. begin
  2889. handle_load_store(list,A_VSTR,PF_None,tmpmmreg,ref);
  2890. end;
  2891. end;
  2892. procedure tbasecgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  2893. begin
  2894. { this code can only be used to transfer raw data, not to perform
  2895. conversions }
  2896. if (tosize<>OS_F32) then
  2897. internalerror(2009112419);
  2898. if not(fromsize in [OS_32,OS_S32]) then
  2899. internalerror(2009112420);
  2900. if assigned(shuffle) and
  2901. not shufflescalar(shuffle) then
  2902. internalerror(2009112516);
  2903. list.concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg));
  2904. end;
  2905. procedure tbasecgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize; mmreg, intreg: tregister;shuffle : pmmshuffle);
  2906. begin
  2907. { this code can only be used to transfer raw data, not to perform
  2908. conversions }
  2909. if (fromsize<>OS_F32) then
  2910. internalerror(2009112430);
  2911. if not(tosize in [OS_32,OS_S32]) then
  2912. internalerror(2009112420);
  2913. if assigned(shuffle) and
  2914. not shufflescalar(shuffle) then
  2915. internalerror(2009112514);
  2916. list.concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg));
  2917. end;
  2918. procedure tbasecgarm.a_opmm_reg_reg(list: tasmlist; op: topcg; size: tcgsize; src, dst: tregister; shuffle: pmmshuffle);
  2919. var
  2920. tmpreg: tregister;
  2921. begin
  2922. { the vfp doesn't support xor nor any other logical operation, but
  2923. this routine is used to initialise global mm regvars. We can
  2924. easily initialise an mm reg with 0 though. }
  2925. case op of
  2926. OP_XOR:
  2927. begin
  2928. if (src<>dst) or
  2929. (reg_cgsize(src)<>size) or
  2930. assigned(shuffle) then
  2931. internalerror(2009112907);
  2932. tmpreg:=getintregister(list,OS_32);
  2933. a_load_const_reg(list,OS_32,0,tmpreg);
  2934. case size of
  2935. OS_F32:
  2936. list.concat(taicpu.op_reg_reg(A_VMOV,dst,tmpreg));
  2937. OS_F64:
  2938. list.concat(taicpu.op_reg_reg_reg(A_VMOV,dst,tmpreg,tmpreg));
  2939. else
  2940. internalerror(2009112908);
  2941. end;
  2942. end
  2943. else
  2944. internalerror(2009112906);
  2945. end;
  2946. end;
  2947. procedure tbasecgarm.maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  2948. const
  2949. overflowops = [OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NEG];
  2950. begin
  2951. if (op in overflowops) and
  2952. (size in [OS_8,OS_S8,OS_16,OS_S16]) then
  2953. a_load_reg_reg(list,OS_32,size,dst,dst);
  2954. end;
  2955. procedure tbasecgarm.safe_mla(list : TAsmList; op1,op2,op3,op4 : TRegister);
  2956. procedure checkreg(var reg : TRegister);
  2957. var
  2958. tmpreg : TRegister;
  2959. begin
  2960. if ((GenerateThumbCode or GenerateThumb2Code) and (getsupreg(reg)=RS_R13)) or
  2961. (getsupreg(reg)=RS_R15) then
  2962. begin
  2963. tmpreg:=getintregister(list,OS_INT);
  2964. a_load_reg_reg(list,OS_INT,OS_INT,reg,tmpreg);
  2965. reg:=tmpreg;
  2966. end;
  2967. end;
  2968. begin
  2969. checkreg(op1);
  2970. checkreg(op2);
  2971. checkreg(op3);
  2972. checkreg(op4);
  2973. list.concat(taicpu.op_reg_reg_reg_reg(A_MLA,op1,op2,op3,op4));
  2974. end;
  2975. procedure tcg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  2976. begin
  2977. case op of
  2978. OP_NEG:
  2979. begin
  2980. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2981. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  2982. list.concat(taicpu.op_reg_reg_const(A_RSC,regdst.reghi,regsrc.reghi,0));
  2983. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2984. end;
  2985. OP_NOT:
  2986. begin
  2987. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  2988. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  2989. end;
  2990. else
  2991. a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);
  2992. end;
  2993. end;
  2994. procedure tcg64farm.a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);
  2995. begin
  2996. a_op64_const_reg_reg(list,op,size,value,reg,reg);
  2997. end;
  2998. procedure tcg64farm.a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);
  2999. var
  3000. ovloc : tlocation;
  3001. begin
  3002. a_op64_const_reg_reg_checkoverflow(list,op,size,value,regsrc,regdst,false,ovloc);
  3003. end;
  3004. procedure tcg64farm.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);
  3005. var
  3006. ovloc : tlocation;
  3007. begin
  3008. a_op64_reg_reg_reg_checkoverflow(list,op,size,regsrc1,regsrc2,regdst,false,ovloc);
  3009. end;
  3010. procedure tcg64farm.a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);
  3011. begin
  3012. { this code can only be used to transfer raw data, not to perform
  3013. conversions }
  3014. if (mmsize<>OS_F64) then
  3015. internalerror(2009112405);
  3016. list.concat(taicpu.op_reg_reg_reg(A_VMOV,mmreg,intreg.reglo,intreg.reghi));
  3017. end;
  3018. procedure tcg64farm.a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);
  3019. begin
  3020. { this code can only be used to transfer raw data, not to perform
  3021. conversions }
  3022. if (mmsize<>OS_F64) then
  3023. internalerror(2009112406);
  3024. list.concat(taicpu.op_reg_reg_reg(A_VMOV,intreg.reglo,intreg.reghi,mmreg));
  3025. end;
  3026. procedure tcg64farm.a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3027. var
  3028. tmpreg : tregister;
  3029. b : byte;
  3030. begin
  3031. ovloc.loc:=LOC_VOID;
  3032. case op of
  3033. OP_NEG,
  3034. OP_NOT :
  3035. internalerror(2012022501);
  3036. end;
  3037. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3038. begin
  3039. case op of
  3040. OP_ADD:
  3041. begin
  3042. if is_shifter_const(lo(value),b) then
  3043. begin
  3044. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3045. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3046. end
  3047. else
  3048. begin
  3049. tmpreg:=cg.getintregister(list,OS_32);
  3050. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3051. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3052. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3053. end;
  3054. if is_shifter_const(hi(value),b) then
  3055. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,hi(value)),PF_S))
  3056. else
  3057. begin
  3058. tmpreg:=cg.getintregister(list,OS_32);
  3059. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3060. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3061. end;
  3062. end;
  3063. OP_SUB:
  3064. begin
  3065. if is_shifter_const(lo(value),b) then
  3066. begin
  3067. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3068. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3069. end
  3070. else
  3071. begin
  3072. tmpreg:=cg.getintregister(list,OS_32);
  3073. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3074. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3075. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3076. end;
  3077. if is_shifter_const(hi(value),b) then
  3078. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))),PF_S))
  3079. else
  3080. begin
  3081. tmpreg:=cg.getintregister(list,OS_32);
  3082. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3083. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3084. end;
  3085. end;
  3086. else
  3087. internalerror(200502131);
  3088. end;
  3089. if size=OS_64 then
  3090. begin
  3091. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3092. ovloc.loc:=LOC_FLAGS;
  3093. case op of
  3094. OP_ADD:
  3095. ovloc.resflags:=F_CS;
  3096. OP_SUB:
  3097. ovloc.resflags:=F_CC;
  3098. end;
  3099. end;
  3100. end
  3101. else
  3102. begin
  3103. case op of
  3104. OP_AND,OP_OR,OP_XOR:
  3105. begin
  3106. cg.a_op_const_reg_reg(list,op,OS_32,aint(lo(value)),regsrc.reglo,regdst.reglo);
  3107. cg.a_op_const_reg_reg(list,op,OS_32,aint(hi(value)),regsrc.reghi,regdst.reghi);
  3108. end;
  3109. OP_ADD:
  3110. begin
  3111. if is_shifter_const(aint(lo(value)),b) then
  3112. begin
  3113. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3114. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3115. end
  3116. else
  3117. begin
  3118. tmpreg:=cg.getintregister(list,OS_32);
  3119. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3120. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3121. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3122. end;
  3123. if is_shifter_const(aint(hi(value)),b) then
  3124. list.concat(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3125. else
  3126. begin
  3127. tmpreg:=cg.getintregister(list,OS_32);
  3128. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  3129. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg));
  3130. end;
  3131. end;
  3132. OP_SUB:
  3133. begin
  3134. if is_shifter_const(aint(lo(value)),b) then
  3135. begin
  3136. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3137. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3138. end
  3139. else
  3140. begin
  3141. tmpreg:=cg.getintregister(list,OS_32);
  3142. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3143. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3144. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3145. end;
  3146. if is_shifter_const(aint(hi(value)),b) then
  3147. list.concat(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3148. else
  3149. begin
  3150. tmpreg:=cg.getintregister(list,OS_32);
  3151. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3152. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg));
  3153. end;
  3154. end;
  3155. else
  3156. internalerror(2003083101);
  3157. end;
  3158. end;
  3159. end;
  3160. procedure tcg64farm.a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3161. begin
  3162. ovloc.loc:=LOC_VOID;
  3163. case op of
  3164. OP_NEG,
  3165. OP_NOT :
  3166. internalerror(2012022502);
  3167. end;
  3168. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3169. begin
  3170. case op of
  3171. OP_ADD:
  3172. begin
  3173. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3174. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3175. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi),PF_S));
  3176. end;
  3177. OP_SUB:
  3178. begin
  3179. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3180. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3181. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi),PF_S));
  3182. end;
  3183. else
  3184. internalerror(2003083101);
  3185. end;
  3186. if size=OS_64 then
  3187. begin
  3188. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3189. ovloc.loc:=LOC_FLAGS;
  3190. case op of
  3191. OP_ADD:
  3192. ovloc.resflags:=F_CS;
  3193. OP_SUB:
  3194. ovloc.resflags:=F_CC;
  3195. end;
  3196. end;
  3197. end
  3198. else
  3199. begin
  3200. case op of
  3201. OP_AND,OP_OR,OP_XOR:
  3202. begin
  3203. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);
  3204. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);
  3205. end;
  3206. OP_ADD:
  3207. begin
  3208. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3209. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3210. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi));
  3211. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3212. end;
  3213. OP_SUB:
  3214. begin
  3215. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3216. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3217. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi));
  3218. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3219. end;
  3220. else
  3221. internalerror(2003083101);
  3222. end;
  3223. end;
  3224. end;
  3225. procedure tthumbcgarm.init_register_allocators;
  3226. begin
  3227. inherited init_register_allocators;
  3228. if assigned(current_procinfo) and (current_procinfo.framepointer=NR_R7) then
  3229. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3230. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6],first_int_imreg,[])
  3231. else
  3232. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3233. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7],first_int_imreg,[]);
  3234. end;
  3235. procedure tthumbcgarm.done_register_allocators;
  3236. begin
  3237. rg[R_INTREGISTER].free;
  3238. rg[R_FPUREGISTER].free;
  3239. rg[R_MMREGISTER].free;
  3240. inherited done_register_allocators;
  3241. end;
  3242. procedure tthumbcgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  3243. var
  3244. ref : treference;
  3245. r : byte;
  3246. regs : tcpuregisterset;
  3247. stackmisalignment : pint;
  3248. registerarea: DWord;
  3249. stack_parameters: Boolean;
  3250. begin
  3251. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3252. LocalSize:=align(LocalSize,4);
  3253. { call instruction does not put anything on the stack }
  3254. stackmisalignment:=0;
  3255. if not(nostackframe) then
  3256. begin
  3257. a_reg_alloc(list,NR_STACK_POINTER_REG);
  3258. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3259. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  3260. { save int registers }
  3261. reference_reset(ref,4);
  3262. ref.index:=NR_STACK_POINTER_REG;
  3263. ref.addressmode:=AM_PREINDEXED;
  3264. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3265. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3266. begin
  3267. //!!!! a_reg_alloc(list,NR_R12);
  3268. //!!!! list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  3269. end;
  3270. { the (old) ARM APCS requires saving both the stack pointer (to
  3271. crawl the stack) and the PC (to identify the function this
  3272. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  3273. and R15 -- still needs updating for EABI and Darwin, they don't
  3274. need that }
  3275. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3276. regs:=regs+[RS_R7,RS_R14]
  3277. else
  3278. // if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  3279. include(regs,RS_R14);
  3280. { safely estimate stack size }
  3281. if localsize+current_settings.alignment.localalignmax+4>508 then
  3282. begin
  3283. include(rg[R_INTREGISTER].used_in_proc,RS_R4);
  3284. include(regs,RS_R4);
  3285. end;
  3286. registerarea:=0;
  3287. if regs<>[] then
  3288. begin
  3289. for r:=RS_R0 to RS_R15 do
  3290. if r in regs then
  3291. inc(registerarea,4);
  3292. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,regs));
  3293. end;
  3294. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3295. if stack_parameters or (LocalSize<>0) or
  3296. ((stackmisalignment<>0) and
  3297. ((pi_do_call in current_procinfo.flags) or
  3298. (po_assembler in current_procinfo.procdef.procoptions))) then
  3299. begin
  3300. { do we access stack parameters?
  3301. if yes, the previously estimated stacksize must be used }
  3302. if stack_parameters then
  3303. begin
  3304. if localsize>tarmprocinfo(current_procinfo).stackframesize then
  3305. begin
  3306. writeln(localsize);
  3307. writeln(tarmprocinfo(current_procinfo).stackframesize);
  3308. internalerror(2013040601);
  3309. end
  3310. else
  3311. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea;
  3312. end
  3313. else
  3314. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3315. if localsize<508 then
  3316. begin
  3317. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  3318. end
  3319. else if localsize<=1016 then
  3320. begin
  3321. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3322. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize-508));
  3323. end
  3324. else
  3325. begin
  3326. a_load_const_reg(list,OS_ADDR,-localsize,NR_R4);
  3327. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R4));
  3328. include(regs,RS_R4);
  3329. //!!!! if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  3330. //!!!! a_reg_alloc(list,NR_R12);
  3331. //!!!! a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  3332. //!!!! list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  3333. //!!!! a_reg_dealloc(list,NR_R12);
  3334. end;
  3335. end;
  3336. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3337. begin
  3338. list.concat(taicpu.op_reg_reg_const(A_ADD,current_procinfo.framepointer,NR_STACK_POINTER_REG,0));
  3339. end;
  3340. end;
  3341. end;
  3342. procedure tthumbcgarm.g_proc_exit(list: TAsmList; parasize: longint; nostackframe: boolean);
  3343. var
  3344. LocalSize : longint;
  3345. r: byte;
  3346. regs : tcpuregisterset;
  3347. registerarea : DWord;
  3348. stackmisalignment: pint;
  3349. stack_parameters : Boolean;
  3350. begin
  3351. if not(nostackframe) then
  3352. begin
  3353. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3354. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3355. include(regs,RS_R15);
  3356. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3357. include(regs,getsupreg(current_procinfo.framepointer));
  3358. registerarea:=0;
  3359. for r:=RS_R0 to RS_R15 do
  3360. if r in regs then
  3361. inc(registerarea,4);
  3362. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3363. LocalSize:=current_procinfo.calc_stackframe_size;
  3364. if stack_parameters then
  3365. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea
  3366. else
  3367. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3368. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  3369. (target_info.system in systems_darwin) then
  3370. begin
  3371. if (LocalSize<>0) or
  3372. ((stackmisalignment<>0) and
  3373. ((pi_do_call in current_procinfo.flags) or
  3374. (po_assembler in current_procinfo.procdef.procoptions))) then
  3375. begin
  3376. if LocalSize=0 then
  3377. else if LocalSize<=508 then
  3378. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  3379. else if LocalSize<=1016 then
  3380. begin
  3381. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3382. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,localsize-508));
  3383. end
  3384. else
  3385. begin
  3386. a_reg_alloc(list,NR_R3);
  3387. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R3);
  3388. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R3));
  3389. a_reg_dealloc(list,NR_R3);
  3390. end;
  3391. end;
  3392. if regs=[] then
  3393. begin
  3394. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3395. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3396. else
  3397. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3398. end
  3399. else
  3400. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,regs));
  3401. end;
  3402. end
  3403. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3404. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3405. else
  3406. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3407. end;
  3408. procedure tthumbcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3409. var
  3410. oppostfix:toppostfix;
  3411. usedtmpref: treference;
  3412. tmpreg,tmpreg2 : tregister;
  3413. dir : integer;
  3414. begin
  3415. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3416. FromSize := ToSize;
  3417. case FromSize of
  3418. { signed integer registers }
  3419. OS_8:
  3420. oppostfix:=PF_B;
  3421. OS_S8:
  3422. oppostfix:=PF_SB;
  3423. OS_16:
  3424. oppostfix:=PF_H;
  3425. OS_S16:
  3426. oppostfix:=PF_SH;
  3427. OS_32,
  3428. OS_S32:
  3429. oppostfix:=PF_None;
  3430. else
  3431. InternalError(200308298);
  3432. end;
  3433. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3434. begin
  3435. if target_info.endian=endian_big then
  3436. dir:=-1
  3437. else
  3438. dir:=1;
  3439. case FromSize of
  3440. OS_16,OS_S16:
  3441. begin
  3442. { only complicated references need an extra loadaddr }
  3443. if assigned(ref.symbol) or
  3444. (ref.index<>NR_NO) or
  3445. (ref.offset<-124) or
  3446. (ref.offset>124) or
  3447. { sometimes the compiler reused registers }
  3448. (reg=ref.index) or
  3449. (reg=ref.base) then
  3450. begin
  3451. tmpreg2:=getintregister(list,OS_INT);
  3452. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3453. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3454. end
  3455. else
  3456. usedtmpref:=ref;
  3457. if target_info.endian=endian_big then
  3458. inc(usedtmpref.offset,1);
  3459. tmpreg:=getintregister(list,OS_INT);
  3460. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3461. inc(usedtmpref.offset,dir);
  3462. if FromSize=OS_16 then
  3463. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3464. else
  3465. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3466. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3467. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3468. end;
  3469. OS_32,OS_S32:
  3470. begin
  3471. tmpreg:=getintregister(list,OS_INT);
  3472. { only complicated references need an extra loadaddr }
  3473. if assigned(ref.symbol) or
  3474. (ref.index<>NR_NO) or
  3475. (ref.offset<-124) or
  3476. (ref.offset>124) or
  3477. { sometimes the compiler reused registers }
  3478. (reg=ref.index) or
  3479. (reg=ref.base) then
  3480. begin
  3481. tmpreg2:=getintregister(list,OS_INT);
  3482. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3483. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3484. end
  3485. else
  3486. usedtmpref:=ref;
  3487. if ref.alignment=2 then
  3488. begin
  3489. if target_info.endian=endian_big then
  3490. inc(usedtmpref.offset,2);
  3491. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  3492. inc(usedtmpref.offset,dir*2);
  3493. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  3494. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3495. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3496. end
  3497. else
  3498. begin
  3499. if target_info.endian=endian_big then
  3500. inc(usedtmpref.offset,3);
  3501. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3502. inc(usedtmpref.offset,dir);
  3503. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3504. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3505. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3506. inc(usedtmpref.offset,dir);
  3507. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3508. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3509. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3510. inc(usedtmpref.offset,dir);
  3511. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3512. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,24));
  3513. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3514. end;
  3515. end
  3516. else
  3517. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3518. end;
  3519. end
  3520. else
  3521. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3522. if (fromsize=OS_S8) and (tosize = OS_16) then
  3523. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  3524. end;
  3525. procedure tthumbcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3526. var
  3527. l : tasmlabel;
  3528. hr : treference;
  3529. begin
  3530. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3531. internalerror(2002090902);
  3532. if is_thumb_imm(a) then
  3533. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3534. else
  3535. begin
  3536. reference_reset(hr,4);
  3537. current_asmdata.getjumplabel(l);
  3538. cg.a_label(current_procinfo.aktlocaldata,l);
  3539. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3540. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3541. hr.symbol:=l;
  3542. hr.base:=NR_PC;
  3543. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3544. end;
  3545. end;
  3546. procedure tthumbcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  3547. var
  3548. hsym : tsym;
  3549. href,
  3550. tmpref : treference;
  3551. paraloc : Pcgparalocation;
  3552. l : TAsmLabel;
  3553. begin
  3554. { calculate the parameter info for the procdef }
  3555. procdef.init_paraloc_info(callerside);
  3556. hsym:=tsym(procdef.parast.Find('self'));
  3557. if not(assigned(hsym) and
  3558. (hsym.typ=paravarsym)) then
  3559. internalerror(200305251);
  3560. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  3561. while paraloc<>nil do
  3562. with paraloc^ do
  3563. begin
  3564. case loc of
  3565. LOC_REGISTER:
  3566. begin
  3567. if is_thumb_imm(ioffset) then
  3568. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  3569. else
  3570. begin
  3571. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3572. reference_reset(tmpref,4);
  3573. current_asmdata.getjumplabel(l);
  3574. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3575. cg.a_label(current_procinfo.aktlocaldata,l);
  3576. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3577. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3578. tmpref.symbol:=l;
  3579. tmpref.base:=NR_PC;
  3580. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3581. a_op_reg_reg(list,OP_SUB,size,NR_R4,register);
  3582. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3583. end;
  3584. end;
  3585. LOC_REFERENCE:
  3586. begin
  3587. { offset in the wrapper needs to be adjusted for the stored
  3588. return address }
  3589. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),sizeof(pint));
  3590. if is_thumb_imm(ioffset) then
  3591. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  3592. else
  3593. begin
  3594. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3595. reference_reset(tmpref,4);
  3596. current_asmdata.getjumplabel(l);
  3597. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3598. cg.a_label(current_procinfo.aktlocaldata,l);
  3599. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3600. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3601. tmpref.symbol:=l;
  3602. tmpref.base:=NR_PC;
  3603. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3604. a_op_reg_ref(list,OP_SUB,size,NR_R4,href);
  3605. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3606. end;
  3607. end
  3608. else
  3609. internalerror(200309189);
  3610. end;
  3611. paraloc:=next;
  3612. end;
  3613. end;
  3614. function tthumbcgarm.handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference;
  3615. var
  3616. href : treference;
  3617. tmpreg : TRegister;
  3618. begin
  3619. href:=ref;
  3620. if { LDR/STR limitations }
  3621. (
  3622. (((op=A_LDR) and (oppostfix=PF_None)) or
  3623. ((op=A_STR) and (oppostfix=PF_None))) and
  3624. (ref.base<>NR_STACK_POINTER_REG) and
  3625. (abs(ref.offset)>124)
  3626. ) or
  3627. { LDRB/STRB limitations }
  3628. (
  3629. (((op=A_LDR) and (oppostfix=PF_B)) or
  3630. ((op=A_LDRB) and (oppostfix=PF_None)) or
  3631. ((op=A_STR) and (oppostfix=PF_B)) or
  3632. ((op=A_STRB) and (oppostfix=PF_None))) and
  3633. ((ref.base=NR_STACK_POINTER_REG) or
  3634. (ref.index=NR_STACK_POINTER_REG) or
  3635. (abs(ref.offset)>31)
  3636. )
  3637. ) or
  3638. { LDRH/STRH limitations }
  3639. (
  3640. (((op=A_LDR) and (oppostfix=PF_H)) or
  3641. ((op=A_LDRH) and (oppostfix=PF_None)) or
  3642. ((op=A_STR) and (oppostfix=PF_H)) or
  3643. ((op=A_STRH) and (oppostfix=PF_None))) and
  3644. ((ref.base=NR_STACK_POINTER_REG) or
  3645. (ref.index=NR_STACK_POINTER_REG) or
  3646. (abs(ref.offset)>62) or
  3647. ((abs(ref.offset) mod 2)<>0)
  3648. )
  3649. ) then
  3650. begin
  3651. tmpreg:=getintregister(list,OS_ADDR);
  3652. a_loadaddr_ref_reg(list,ref,tmpreg);
  3653. reference_reset_base(href,tmpreg,0,ref.alignment);
  3654. end
  3655. else if (op=A_LDR) and
  3656. (oppostfix in [PF_None]) and
  3657. (ref.base=NR_STACK_POINTER_REG) and
  3658. (abs(ref.offset)>1020) then
  3659. begin
  3660. tmpreg:=getintregister(list,OS_ADDR);
  3661. a_loadaddr_ref_reg(list,ref,tmpreg);
  3662. reference_reset_base(href,tmpreg,0,ref.alignment);
  3663. end
  3664. else if (op=A_LDR) and
  3665. ((oppostfix in [PF_SH,PF_SB]) or
  3666. (abs(ref.offset)>124)) then
  3667. begin
  3668. tmpreg:=getintregister(list,OS_ADDR);
  3669. a_loadaddr_ref_reg(list,ref,tmpreg);
  3670. reference_reset_base(href,tmpreg,0,ref.alignment);
  3671. end;
  3672. Result:=inherited handle_load_store(list, op, oppostfix, reg, href);
  3673. end;
  3674. procedure tthumbcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  3675. var
  3676. tmpreg : tregister;
  3677. begin
  3678. case op of
  3679. OP_NEG:
  3680. list.concat(taicpu.op_reg_reg(A_NEG,dst,src));
  3681. OP_NOT:
  3682. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  3683. OP_DIV,OP_IDIV:
  3684. internalerror(200308284);
  3685. OP_ROL:
  3686. begin
  3687. if not(size in [OS_32,OS_S32]) then
  3688. internalerror(2008072801);
  3689. { simulate ROL by ror'ing 32-value }
  3690. tmpreg:=getintregister(list,OS_32);
  3691. a_load_const_reg(list,OS_32,32,tmpreg);
  3692. list.concat(taicpu.op_reg_reg(A_SUB,tmpreg,src));
  3693. list.concat(taicpu.op_reg_reg(A_ROR,dst,src));
  3694. end;
  3695. else
  3696. begin
  3697. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3698. list.concat(setoppostfix(
  3699. taicpu.op_reg_reg(op_reg_opcg2asmop[op],dst,src),op_reg_postfix[op]));
  3700. end;
  3701. end;
  3702. maybeadjustresult(list,op,size,dst);
  3703. end;
  3704. procedure tthumbcgarm.a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);
  3705. var
  3706. tmpreg : tregister;
  3707. {$ifdef DUMMY}
  3708. l1 : longint;
  3709. {$endif DUMMY}
  3710. begin
  3711. //!!! ovloc.loc:=LOC_VOID;
  3712. if {$ifopt R+}(a<>-2147483648) and{$endif} {!!!!!! not setflags and } is_thumb_imm(-a) then
  3713. case op of
  3714. OP_ADD:
  3715. begin
  3716. op:=OP_SUB;
  3717. a:=aint(dword(-a));
  3718. end;
  3719. OP_SUB:
  3720. begin
  3721. op:=OP_ADD;
  3722. a:=aint(dword(-a));
  3723. end
  3724. end;
  3725. if is_thumb_imm(a) and (op in [OP_ADD,OP_SUB]) then
  3726. begin
  3727. // if cgsetflags or setflags then
  3728. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3729. list.concat(setoppostfix(
  3730. taicpu.op_reg_const(op_reg_opcg2asmop[op],dst,a),op_reg_postfix[op]));
  3731. if (cgsetflags {!!! or setflags }) and (size in [OS_8,OS_16,OS_32]) then
  3732. begin
  3733. //!!! ovloc.loc:=LOC_FLAGS;
  3734. case op of
  3735. OP_ADD:
  3736. //!!! ovloc.resflags:=F_CS;
  3737. ;
  3738. OP_SUB:
  3739. //!!! ovloc.resflags:=F_CC;
  3740. ;
  3741. end;
  3742. end;
  3743. end
  3744. else
  3745. begin
  3746. { there could be added some more sophisticated optimizations }
  3747. if (op in [OP_MUL,OP_IMUL,OP_DIV,OP_IDIV]) and (a=1) then
  3748. a_load_reg_reg(list,size,size,dst,dst)
  3749. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  3750. a_load_const_reg(list,size,0,dst)
  3751. else if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  3752. a_op_reg_reg(list,OP_NEG,size,dst,dst)
  3753. { we do this here instead in the peephole optimizer because
  3754. it saves us a register }
  3755. {$ifdef DUMMY}
  3756. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  3757. a_op_const_reg_reg(list,OP_SHL,size,l1,dst,dst)
  3758. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  3759. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  3760. begin
  3761. if l1>32 then{roozbeh does this ever happen?}
  3762. internalerror(200308296);
  3763. shifterop_reset(so);
  3764. so.shiftmode:=SM_LSL;
  3765. so.shiftimm:=l1;
  3766. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,dst,so));
  3767. end
  3768. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  3769. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  3770. begin
  3771. if l1>32 then{does this ever happen?}
  3772. internalerror(201205181);
  3773. shifterop_reset(so);
  3774. so.shiftmode:=SM_LSL;
  3775. so.shiftimm:=l1;
  3776. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,dst,dst,so));
  3777. end
  3778. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,dst,dst) then
  3779. begin
  3780. { nothing to do on success }
  3781. end
  3782. {$endif DUMMY}
  3783. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  3784. Just using mov x, #0 might allow some easier optimizations down the line. }
  3785. else if (op = OP_AND) and (dword(a)=0) then
  3786. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  3787. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  3788. else if (op = OP_AND) and (not(dword(a))=0) then
  3789. // do nothing
  3790. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  3791. broader range of shifterconstants.}
  3792. {$ifdef DUMMY}
  3793. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  3794. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,not(dword(a))))
  3795. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  3796. begin
  3797. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm1));
  3798. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  3799. end
  3800. else if (op in [OP_ADD, OP_SUB, OP_OR]) and
  3801. not(cgsetflags or setflags) and
  3802. split_into_shifter_const(a, imm1, imm2) then
  3803. begin
  3804. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm1));
  3805. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  3806. end
  3807. {$endif DUMMY}
  3808. else if (op in [OP_SHL, OP_SHR, OP_SAR]) then
  3809. begin
  3810. list.concat(taicpu.op_reg_reg_const(op_reg_opcg2asmop[op],dst,dst,a));
  3811. end
  3812. else
  3813. begin
  3814. tmpreg:=getintregister(list,size);
  3815. a_load_const_reg(list,size,a,tmpreg);
  3816. a_op_reg_reg(list,op,size,tmpreg,dst);
  3817. end;
  3818. end;
  3819. maybeadjustresult(list,op,size,dst);
  3820. end;
  3821. procedure tthumbcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister);
  3822. begin
  3823. if (op=OP_ADD) and (src=NR_R13) and (dst<>NR_R13) and ((a mod 4)=0) and (a>0) and (a<=1020) then
  3824. list.concat(taicpu.op_reg_reg_const(A_ADD,dst,src,a))
  3825. else
  3826. inherited a_op_const_reg_reg(list,op,size,a,src,dst);
  3827. end;
  3828. procedure tthumbcgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  3829. var
  3830. l1,l2 : tasmlabel;
  3831. ai : taicpu;
  3832. begin
  3833. current_asmdata.getjumplabel(l1);
  3834. current_asmdata.getjumplabel(l2);
  3835. ai:=setcondition(taicpu.op_sym(A_B,l1),flags_to_cond(f));
  3836. ai.is_jmp:=true;
  3837. list.concat(ai);
  3838. list.concat(taicpu.op_reg_const(A_MOV,reg,0));
  3839. list.concat(taicpu.op_sym(A_B,l2));
  3840. cg.a_label(list,l1);
  3841. list.concat(taicpu.op_reg_const(A_MOV,reg,1));
  3842. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3843. cg.a_label(list,l2);
  3844. end;
  3845. procedure tthumb2cgarm.init_register_allocators;
  3846. begin
  3847. inherited init_register_allocators;
  3848. { currently, we save R14 always, so we can use it }
  3849. if (target_info.system<>system_arm_darwin) then
  3850. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3851. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3852. RS_R9,RS_R10,RS_R12,RS_R14],first_int_imreg,[])
  3853. else
  3854. { r9 is not available on Darwin according to the llvm code generator }
  3855. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3856. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3857. RS_R10,RS_R12,RS_R14],first_int_imreg,[]);
  3858. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  3859. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  3860. if current_settings.fputype=fpu_vfpv3 then
  3861. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3862. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3863. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  3864. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3865. ],first_mm_imreg,[])
  3866. else if current_settings.fputype in [fpu_fpv4_s16,fpu_vfpv3_d16] then
  3867. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3868. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3869. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3870. ],first_mm_imreg,[])
  3871. else
  3872. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBNONE,
  3873. [RS_S0,RS_S1,RS_R2,RS_R3,RS_R4,RS_S31],first_mm_imreg,[]);
  3874. end;
  3875. procedure tthumb2cgarm.done_register_allocators;
  3876. begin
  3877. rg[R_INTREGISTER].free;
  3878. rg[R_FPUREGISTER].free;
  3879. rg[R_MMREGISTER].free;
  3880. inherited done_register_allocators;
  3881. end;
  3882. procedure tthumb2cgarm.a_call_reg(list : TAsmList;reg: tregister);
  3883. begin
  3884. list.concat(taicpu.op_reg(A_BLX, reg));
  3885. {
  3886. the compiler does not properly set this flag anymore in pass 1, and
  3887. for now we only need it after pass 2 (I hope) (JM)
  3888. if not(pi_do_call in current_procinfo.flags) then
  3889. internalerror(2003060703);
  3890. }
  3891. include(current_procinfo.flags,pi_do_call);
  3892. end;
  3893. procedure tthumb2cgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3894. var
  3895. l : tasmlabel;
  3896. hr : treference;
  3897. begin
  3898. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3899. internalerror(2002090902);
  3900. if is_thumb32_imm(a) then
  3901. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3902. else if is_thumb32_imm(not(a)) then
  3903. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  3904. else if (a and $FFFF)=a then
  3905. list.concat(taicpu.op_reg_const(A_MOVW,reg,a))
  3906. else
  3907. begin
  3908. reference_reset(hr,4);
  3909. current_asmdata.getjumplabel(l);
  3910. cg.a_label(current_procinfo.aktlocaldata,l);
  3911. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3912. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3913. hr.symbol:=l;
  3914. hr.base:=NR_PC;
  3915. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3916. end;
  3917. end;
  3918. procedure tthumb2cgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3919. var
  3920. oppostfix:toppostfix;
  3921. usedtmpref: treference;
  3922. tmpreg,tmpreg2 : tregister;
  3923. so : tshifterop;
  3924. dir : integer;
  3925. begin
  3926. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3927. FromSize := ToSize;
  3928. case FromSize of
  3929. { signed integer registers }
  3930. OS_8:
  3931. oppostfix:=PF_B;
  3932. OS_S8:
  3933. oppostfix:=PF_SB;
  3934. OS_16:
  3935. oppostfix:=PF_H;
  3936. OS_S16:
  3937. oppostfix:=PF_SH;
  3938. OS_32,
  3939. OS_S32:
  3940. oppostfix:=PF_None;
  3941. else
  3942. InternalError(200308299);
  3943. end;
  3944. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3945. begin
  3946. if target_info.endian=endian_big then
  3947. dir:=-1
  3948. else
  3949. dir:=1;
  3950. case FromSize of
  3951. OS_16,OS_S16:
  3952. begin
  3953. { only complicated references need an extra loadaddr }
  3954. if assigned(ref.symbol) or
  3955. (ref.index<>NR_NO) or
  3956. (ref.offset<-255) or
  3957. (ref.offset>4094) or
  3958. { sometimes the compiler reused registers }
  3959. (reg=ref.index) or
  3960. (reg=ref.base) then
  3961. begin
  3962. tmpreg2:=getintregister(list,OS_INT);
  3963. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3964. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3965. end
  3966. else
  3967. usedtmpref:=ref;
  3968. if target_info.endian=endian_big then
  3969. inc(usedtmpref.offset,1);
  3970. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  3971. tmpreg:=getintregister(list,OS_INT);
  3972. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3973. inc(usedtmpref.offset,dir);
  3974. if FromSize=OS_16 then
  3975. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3976. else
  3977. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3978. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  3979. end;
  3980. OS_32,OS_S32:
  3981. begin
  3982. tmpreg:=getintregister(list,OS_INT);
  3983. { only complicated references need an extra loadaddr }
  3984. if assigned(ref.symbol) or
  3985. (ref.index<>NR_NO) or
  3986. (ref.offset<-255) or
  3987. (ref.offset>4092) or
  3988. { sometimes the compiler reused registers }
  3989. (reg=ref.index) or
  3990. (reg=ref.base) then
  3991. begin
  3992. tmpreg2:=getintregister(list,OS_INT);
  3993. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3994. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3995. end
  3996. else
  3997. usedtmpref:=ref;
  3998. shifterop_reset(so);so.shiftmode:=SM_LSL;
  3999. if ref.alignment=2 then
  4000. begin
  4001. if target_info.endian=endian_big then
  4002. inc(usedtmpref.offset,2);
  4003. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  4004. inc(usedtmpref.offset,dir*2);
  4005. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  4006. so.shiftimm:=16;
  4007. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4008. end
  4009. else
  4010. begin
  4011. if target_info.endian=endian_big then
  4012. inc(usedtmpref.offset,3);
  4013. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  4014. inc(usedtmpref.offset,dir);
  4015. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4016. so.shiftimm:=8;
  4017. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4018. inc(usedtmpref.offset,dir);
  4019. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4020. so.shiftimm:=16;
  4021. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4022. inc(usedtmpref.offset,dir);
  4023. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4024. so.shiftimm:=24;
  4025. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4026. end;
  4027. end
  4028. else
  4029. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4030. end;
  4031. end
  4032. else
  4033. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4034. if (fromsize=OS_S8) and (tosize = OS_16) then
  4035. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  4036. end;
  4037. procedure tthumb2cgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  4038. begin
  4039. if op = OP_NOT then
  4040. begin
  4041. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  4042. case size of
  4043. OS_8: list.concat(taicpu.op_reg_reg(A_UXTB,dst,dst));
  4044. OS_S8: list.concat(taicpu.op_reg_reg(A_SXTB,dst,dst));
  4045. OS_16: list.concat(taicpu.op_reg_reg(A_UXTH,dst,dst));
  4046. OS_S16: list.concat(taicpu.op_reg_reg(A_SXTH,dst,dst));
  4047. end;
  4048. end
  4049. else
  4050. inherited a_op_reg_reg(list, op, size, src, dst);
  4051. end;
  4052. procedure tthumb2cgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4053. var
  4054. shift, width : byte;
  4055. tmpreg : tregister;
  4056. so : tshifterop;
  4057. l1 : longint;
  4058. begin
  4059. ovloc.loc:=LOC_VOID;
  4060. if {$ifopt R+}(a<>-2147483648) and{$endif} is_shifter_const(-a,shift) then
  4061. case op of
  4062. OP_ADD:
  4063. begin
  4064. op:=OP_SUB;
  4065. a:=aint(dword(-a));
  4066. end;
  4067. OP_SUB:
  4068. begin
  4069. op:=OP_ADD;
  4070. a:=aint(dword(-a));
  4071. end
  4072. end;
  4073. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  4074. case op of
  4075. OP_NEG,OP_NOT,
  4076. OP_DIV,OP_IDIV:
  4077. internalerror(200308285);
  4078. OP_SHL:
  4079. begin
  4080. if a>32 then
  4081. internalerror(2014020703);
  4082. if a<>0 then
  4083. begin
  4084. shifterop_reset(so);
  4085. so.shiftmode:=SM_LSL;
  4086. so.shiftimm:=a;
  4087. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4088. end
  4089. else
  4090. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4091. end;
  4092. OP_ROL:
  4093. begin
  4094. if a>32 then
  4095. internalerror(2014020704);
  4096. if a<>0 then
  4097. begin
  4098. shifterop_reset(so);
  4099. so.shiftmode:=SM_ROR;
  4100. so.shiftimm:=32-a;
  4101. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4102. end
  4103. else
  4104. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4105. end;
  4106. OP_ROR:
  4107. begin
  4108. if a>32 then
  4109. internalerror(2014020705);
  4110. if a<>0 then
  4111. begin
  4112. shifterop_reset(so);
  4113. so.shiftmode:=SM_ROR;
  4114. so.shiftimm:=a;
  4115. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4116. end
  4117. else
  4118. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4119. end;
  4120. OP_SHR:
  4121. begin
  4122. if a>32 then
  4123. internalerror(200308292);
  4124. shifterop_reset(so);
  4125. if a<>0 then
  4126. begin
  4127. so.shiftmode:=SM_LSR;
  4128. so.shiftimm:=a;
  4129. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4130. end
  4131. else
  4132. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4133. end;
  4134. OP_SAR:
  4135. begin
  4136. if a>32 then
  4137. internalerror(200308295);
  4138. if a<>0 then
  4139. begin
  4140. shifterop_reset(so);
  4141. so.shiftmode:=SM_ASR;
  4142. so.shiftimm:=a;
  4143. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4144. end
  4145. else
  4146. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4147. end;
  4148. else
  4149. if (op in [OP_SUB, OP_ADD]) and
  4150. ((a < 0) or
  4151. (a > 4095)) then
  4152. begin
  4153. tmpreg:=getintregister(list,size);
  4154. a_load_const_reg(list, size, a, tmpreg);
  4155. if cgsetflags or setflags then
  4156. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4157. list.concat(setoppostfix(
  4158. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4159. end
  4160. else
  4161. begin
  4162. if cgsetflags or setflags then
  4163. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4164. list.concat(setoppostfix(
  4165. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4166. end;
  4167. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  4168. begin
  4169. ovloc.loc:=LOC_FLAGS;
  4170. case op of
  4171. OP_ADD:
  4172. ovloc.resflags:=F_CS;
  4173. OP_SUB:
  4174. ovloc.resflags:=F_CC;
  4175. end;
  4176. end;
  4177. end
  4178. else
  4179. begin
  4180. { there could be added some more sophisticated optimizations }
  4181. if (op in [OP_MUL,OP_IMUL]) and (a=1) then
  4182. a_load_reg_reg(list,size,size,src,dst)
  4183. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  4184. a_load_const_reg(list,size,0,dst)
  4185. else if (op in [OP_IMUL]) and (a=-1) then
  4186. a_op_reg_reg(list,OP_NEG,size,src,dst)
  4187. { we do this here instead in the peephole optimizer because
  4188. it saves us a register }
  4189. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  4190. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  4191. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  4192. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  4193. begin
  4194. if l1>32 then{roozbeh does this ever happen?}
  4195. internalerror(200308296);
  4196. shifterop_reset(so);
  4197. so.shiftmode:=SM_LSL;
  4198. so.shiftimm:=l1;
  4199. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  4200. end
  4201. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  4202. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  4203. begin
  4204. if l1>32 then{does this ever happen?}
  4205. internalerror(201205181);
  4206. shifterop_reset(so);
  4207. so.shiftmode:=SM_LSL;
  4208. so.shiftimm:=l1;
  4209. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  4210. end
  4211. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  4212. begin
  4213. { nothing to do on success }
  4214. end
  4215. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  4216. Just using mov x, #0 might allow some easier optimizations down the line. }
  4217. else if (op = OP_AND) and (dword(a)=0) then
  4218. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  4219. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  4220. else if (op = OP_AND) and (not(dword(a))=0) then
  4221. list.concat(taicpu.op_reg_reg(A_MOV,dst,src))
  4222. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  4223. broader range of shifterconstants.}
  4224. {else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  4225. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))}
  4226. else if (op = OP_AND) and is_thumb32_imm(a) then
  4227. list.concat(taicpu.op_reg_reg_const(A_AND,dst,src,dword(a)))
  4228. else if (op = OP_AND) and (a = $FFFF) then
  4229. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  4230. else if (op = OP_AND) and is_thumb32_imm(not(dword(a))) then
  4231. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  4232. else if (op = OP_AND) and is_continuous_mask(not(a), shift, width) then
  4233. begin
  4234. a_load_reg_reg(list,size,size,src,dst);
  4235. list.concat(taicpu.op_reg_const_const(A_BFC,dst,shift,width))
  4236. end
  4237. else
  4238. begin
  4239. tmpreg:=getintregister(list,size);
  4240. a_load_const_reg(list,size,a,tmpreg);
  4241. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  4242. end;
  4243. end;
  4244. maybeadjustresult(list,op,size,dst);
  4245. end;
  4246. const
  4247. op_reg_reg_opcg2asmopThumb2: array[TOpCG] of tasmop =
  4248. (A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NONE,A_MVN,A_ORR,
  4249. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  4250. procedure tthumb2cgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4251. var
  4252. so : tshifterop;
  4253. tmpreg,overflowreg : tregister;
  4254. asmop : tasmop;
  4255. begin
  4256. ovloc.loc:=LOC_VOID;
  4257. case op of
  4258. OP_NEG,OP_NOT:
  4259. internalerror(200308286);
  4260. OP_ROL:
  4261. begin
  4262. if not(size in [OS_32,OS_S32]) then
  4263. internalerror(2008072801);
  4264. { simulate ROL by ror'ing 32-value }
  4265. tmpreg:=getintregister(list,OS_32);
  4266. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,32));
  4267. list.concat(taicpu.op_reg_reg_reg(A_SUB,src1,tmpreg,src1));
  4268. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4269. end;
  4270. OP_ROR:
  4271. begin
  4272. if not(size in [OS_32,OS_S32]) then
  4273. internalerror(2008072802);
  4274. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4275. end;
  4276. OP_IMUL,
  4277. OP_MUL:
  4278. begin
  4279. if cgsetflags or setflags then
  4280. begin
  4281. overflowreg:=getintregister(list,size);
  4282. if op=OP_IMUL then
  4283. asmop:=A_SMULL
  4284. else
  4285. asmop:=A_UMULL;
  4286. { the arm doesn't allow that rd and rm are the same }
  4287. if dst=src2 then
  4288. begin
  4289. if dst<>src1 then
  4290. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  4291. else
  4292. begin
  4293. tmpreg:=getintregister(list,size);
  4294. a_load_reg_reg(list,size,size,src2,dst);
  4295. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  4296. end;
  4297. end
  4298. else
  4299. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  4300. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4301. if op=OP_IMUL then
  4302. begin
  4303. shifterop_reset(so);
  4304. so.shiftmode:=SM_ASR;
  4305. so.shiftimm:=31;
  4306. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  4307. end
  4308. else
  4309. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  4310. ovloc.loc:=LOC_FLAGS;
  4311. ovloc.resflags:=F_NE;
  4312. end
  4313. else
  4314. begin
  4315. { the arm doesn't allow that rd and rm are the same }
  4316. if dst=src2 then
  4317. begin
  4318. if dst<>src1 then
  4319. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  4320. else
  4321. begin
  4322. tmpreg:=getintregister(list,size);
  4323. a_load_reg_reg(list,size,size,src2,dst);
  4324. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  4325. end;
  4326. end
  4327. else
  4328. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  4329. end;
  4330. end;
  4331. else
  4332. begin
  4333. if cgsetflags or setflags then
  4334. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4335. {$ifdef dummy}
  4336. { R13 is not allowed for certain instruction operands }
  4337. if op_reg_reg_opcg2asmopThumb2[op] in [A_ADD,A_SUB,A_AND,A_BIC,A_EOR] then
  4338. begin
  4339. if getsupreg(dst)=RS_R13 then
  4340. begin
  4341. tmpreg:=getintregister(list,OS_INT);
  4342. a_load_reg_reg(list,OS_INT,OS_INT,dst,tmpreg);
  4343. dst:=tmpreg;
  4344. end;
  4345. if getsupreg(src1)=RS_R13 then
  4346. begin
  4347. tmpreg:=getintregister(list,OS_INT);
  4348. a_load_reg_reg(list,OS_INT,OS_INT,src1,tmpreg);
  4349. src1:=tmpreg;
  4350. end;
  4351. end;
  4352. {$endif}
  4353. list.concat(setoppostfix(
  4354. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmopThumb2[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4355. end;
  4356. end;
  4357. maybeadjustresult(list,op,size,dst);
  4358. end;
  4359. procedure tthumb2cgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  4360. begin
  4361. list.concat(taicpu.op_cond(A_ITE, flags_to_cond(f)));
  4362. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  4363. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  4364. end;
  4365. procedure tthumb2cgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  4366. var
  4367. ref : treference;
  4368. shift : byte;
  4369. firstfloatreg,lastfloatreg,
  4370. r : byte;
  4371. regs : tcpuregisterset;
  4372. stackmisalignment: pint;
  4373. begin
  4374. LocalSize:=align(LocalSize,4);
  4375. { call instruction does not put anything on the stack }
  4376. stackmisalignment:=0;
  4377. if not(nostackframe) then
  4378. begin
  4379. firstfloatreg:=RS_NO;
  4380. lastfloatreg:=RS_NO;
  4381. { save floating point registers? }
  4382. for r:=RS_F0 to RS_F7 do
  4383. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4384. begin
  4385. if firstfloatreg=RS_NO then
  4386. firstfloatreg:=r;
  4387. lastfloatreg:=r;
  4388. inc(stackmisalignment,12);
  4389. end;
  4390. a_reg_alloc(list,NR_STACK_POINTER_REG);
  4391. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4392. begin
  4393. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  4394. a_reg_alloc(list,NR_R12);
  4395. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  4396. end;
  4397. { save int registers }
  4398. reference_reset(ref,4);
  4399. ref.index:=NR_STACK_POINTER_REG;
  4400. ref.addressmode:=AM_PREINDEXED;
  4401. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4402. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4403. regs:=regs+[RS_FRAME_POINTER_REG,RS_R14]
  4404. else if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  4405. include(regs,RS_R14);
  4406. if regs<>[] then
  4407. begin
  4408. for r:=RS_R0 to RS_R15 do
  4409. if (r in regs) then
  4410. inc(stackmisalignment,4);
  4411. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4412. end;
  4413. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4414. begin
  4415. { the framepointer now points to the saved R15, so the saved
  4416. framepointer is at R11-12 (for get_caller_frame) }
  4417. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  4418. a_reg_dealloc(list,NR_R12);
  4419. end;
  4420. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4421. if (LocalSize<>0) or
  4422. ((stackmisalignment<>0) and
  4423. ((pi_do_call in current_procinfo.flags) or
  4424. (po_assembler in current_procinfo.procdef.procoptions))) then
  4425. begin
  4426. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4427. if not(is_shifter_const(localsize,shift)) then
  4428. begin
  4429. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  4430. a_reg_alloc(list,NR_R12);
  4431. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4432. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  4433. a_reg_dealloc(list,NR_R12);
  4434. end
  4435. else
  4436. begin
  4437. a_reg_dealloc(list,NR_R12);
  4438. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  4439. end;
  4440. end;
  4441. if firstfloatreg<>RS_NO then
  4442. begin
  4443. reference_reset(ref,4);
  4444. if tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023 then
  4445. begin
  4446. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  4447. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4448. ref.base:=NR_R12;
  4449. end
  4450. else
  4451. begin
  4452. ref.base:=current_procinfo.framepointer;
  4453. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  4454. end;
  4455. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4456. lastfloatreg-firstfloatreg+1,ref));
  4457. end;
  4458. end;
  4459. end;
  4460. procedure tthumb2cgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  4461. var
  4462. ref : treference;
  4463. firstfloatreg,lastfloatreg,
  4464. r : byte;
  4465. shift : byte;
  4466. regs : tcpuregisterset;
  4467. LocalSize : longint;
  4468. stackmisalignment: pint;
  4469. begin
  4470. if not(nostackframe) then
  4471. begin
  4472. stackmisalignment:=0;
  4473. { restore floating point register }
  4474. firstfloatreg:=RS_NO;
  4475. lastfloatreg:=RS_NO;
  4476. { save floating point registers? }
  4477. for r:=RS_F0 to RS_F7 do
  4478. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4479. begin
  4480. if firstfloatreg=RS_NO then
  4481. firstfloatreg:=r;
  4482. lastfloatreg:=r;
  4483. { floating point register space is already included in
  4484. localsize below by calc_stackframe_size
  4485. inc(stackmisalignment,12);
  4486. }
  4487. end;
  4488. if firstfloatreg<>RS_NO then
  4489. begin
  4490. reference_reset(ref,4);
  4491. if tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023 then
  4492. begin
  4493. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  4494. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4495. ref.base:=NR_R12;
  4496. end
  4497. else
  4498. begin
  4499. ref.base:=current_procinfo.framepointer;
  4500. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  4501. end;
  4502. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4503. lastfloatreg-firstfloatreg+1,ref));
  4504. end;
  4505. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4506. if (pi_do_call in current_procinfo.flags) or (regs<>[]) then
  4507. begin
  4508. exclude(regs,RS_R14);
  4509. include(regs,RS_R15);
  4510. end;
  4511. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  4512. regs:=regs+[RS_FRAME_POINTER_REG,RS_R15];
  4513. for r:=RS_R0 to RS_R15 do
  4514. if (r in regs) then
  4515. inc(stackmisalignment,4);
  4516. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4517. LocalSize:=current_procinfo.calc_stackframe_size;
  4518. if (LocalSize<>0) or
  4519. ((stackmisalignment<>0) and
  4520. ((pi_do_call in current_procinfo.flags) or
  4521. (po_assembler in current_procinfo.procdef.procoptions))) then
  4522. begin
  4523. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4524. if not(is_shifter_const(LocalSize,shift)) then
  4525. begin
  4526. a_reg_alloc(list,NR_R12);
  4527. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4528. list.concat(taicpu.op_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_R12));
  4529. a_reg_dealloc(list,NR_R12);
  4530. end
  4531. else
  4532. begin
  4533. a_reg_dealloc(list,NR_R12);
  4534. list.concat(taicpu.op_reg_const(A_ADD,NR_STACK_POINTER_REG,LocalSize));
  4535. end;
  4536. end;
  4537. if regs=[] then
  4538. list.concat(taicpu.op_reg_reg(A_MOV,NR_R15,NR_R14))
  4539. else
  4540. begin
  4541. reference_reset(ref,4);
  4542. ref.index:=NR_STACK_POINTER_REG;
  4543. ref.addressmode:=AM_PREINDEXED;
  4544. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4545. end;
  4546. end
  4547. else
  4548. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14));
  4549. end;
  4550. function tthumb2cgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  4551. var
  4552. tmpreg : tregister;
  4553. tmpref : treference;
  4554. l : tasmlabel;
  4555. begin
  4556. tmpreg:=NR_NO;
  4557. { Be sure to have a base register }
  4558. if (ref.base=NR_NO) then
  4559. begin
  4560. if ref.shiftmode<>SM_None then
  4561. internalerror(2014020706);
  4562. ref.base:=ref.index;
  4563. ref.index:=NR_NO;
  4564. end;
  4565. { absolute symbols can't be handled directly, we've to store the symbol reference
  4566. in the text segment and access it pc relative
  4567. For now, we assume that references where base or index equals to PC are already
  4568. relative, all other references are assumed to be absolute and thus they need
  4569. to be handled extra.
  4570. A proper solution would be to change refoptions to a set and store the information
  4571. if the symbol is absolute or relative there.
  4572. }
  4573. if (assigned(ref.symbol) and
  4574. not(is_pc(ref.base)) and
  4575. not(is_pc(ref.index))
  4576. ) or
  4577. { [#xxx] isn't a valid address operand }
  4578. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  4579. //(ref.offset<-4095) or
  4580. (ref.offset<-255) or
  4581. (ref.offset>4095) or
  4582. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  4583. ((ref.offset<-255) or
  4584. (ref.offset>255)
  4585. )
  4586. ) or
  4587. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  4588. ((ref.offset<-1020) or
  4589. (ref.offset>1020) or
  4590. ((abs(ref.offset) mod 4)<>0) or
  4591. { the usual pc relative symbol handling assumes possible offsets of +/- 4095 }
  4592. assigned(ref.symbol)
  4593. )
  4594. ) then
  4595. begin
  4596. reference_reset(tmpref,4);
  4597. { load symbol }
  4598. tmpreg:=getintregister(list,OS_INT);
  4599. if assigned(ref.symbol) then
  4600. begin
  4601. current_asmdata.getjumplabel(l);
  4602. cg.a_label(current_procinfo.aktlocaldata,l);
  4603. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  4604. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset));
  4605. { load consts entry }
  4606. tmpref.symbol:=l;
  4607. tmpref.base:=NR_R15;
  4608. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  4609. { in case of LDF/STF, we got rid of the NR_R15 }
  4610. if is_pc(ref.base) then
  4611. ref.base:=NR_NO;
  4612. if is_pc(ref.index) then
  4613. ref.index:=NR_NO;
  4614. end
  4615. else
  4616. a_load_const_reg(list,OS_ADDR,ref.offset,tmpreg);
  4617. if (ref.base<>NR_NO) then
  4618. begin
  4619. if ref.index<>NR_NO then
  4620. begin
  4621. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4622. ref.base:=tmpreg;
  4623. end
  4624. else
  4625. begin
  4626. ref.index:=tmpreg;
  4627. ref.shiftimm:=0;
  4628. ref.signindex:=1;
  4629. ref.shiftmode:=SM_None;
  4630. end;
  4631. end
  4632. else
  4633. ref.base:=tmpreg;
  4634. ref.offset:=0;
  4635. ref.symbol:=nil;
  4636. end;
  4637. if (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  4638. begin
  4639. if tmpreg<>NR_NO then
  4640. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg,tmpreg)
  4641. else
  4642. begin
  4643. tmpreg:=getintregister(list,OS_ADDR);
  4644. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg);
  4645. ref.base:=tmpreg;
  4646. end;
  4647. ref.offset:=0;
  4648. end;
  4649. { Hack? Thumb2 doesn't allow PC indexed addressing modes(although it does in the specification) }
  4650. if (ref.base=NR_R15) and (ref.index<>NR_NO) and (ref.shiftmode <> sm_none) then
  4651. begin
  4652. tmpreg:=getintregister(list,OS_ADDR);
  4653. list.concat(taicpu.op_reg_reg(A_MOV, tmpreg, NR_R15));
  4654. ref.base := tmpreg;
  4655. end;
  4656. { floating point operations have only limited references
  4657. we expect here, that a base is already set }
  4658. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  4659. begin
  4660. if ref.shiftmode<>SM_none then
  4661. internalerror(200309121);
  4662. if tmpreg<>NR_NO then
  4663. begin
  4664. if ref.base=tmpreg then
  4665. begin
  4666. if ref.signindex<0 then
  4667. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,tmpreg,ref.index))
  4668. else
  4669. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,tmpreg,ref.index));
  4670. ref.index:=NR_NO;
  4671. end
  4672. else
  4673. begin
  4674. if ref.index<>tmpreg then
  4675. internalerror(200403161);
  4676. if ref.signindex<0 then
  4677. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,ref.base,tmpreg))
  4678. else
  4679. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4680. ref.base:=tmpreg;
  4681. ref.index:=NR_NO;
  4682. end;
  4683. end
  4684. else
  4685. begin
  4686. tmpreg:=getintregister(list,OS_ADDR);
  4687. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,ref.index));
  4688. ref.base:=tmpreg;
  4689. ref.index:=NR_NO;
  4690. end;
  4691. end;
  4692. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  4693. Result := ref;
  4694. end;
  4695. procedure tthumb2cgarm.a_loadmm_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister; shuffle: pmmshuffle);
  4696. var
  4697. instr: taicpu;
  4698. begin
  4699. if (fromsize=OS_F32) and
  4700. (tosize=OS_F32) then
  4701. begin
  4702. instr:=setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32);
  4703. list.Concat(instr);
  4704. add_move_instruction(instr);
  4705. end
  4706. else if (fromsize=OS_F64) and
  4707. (tosize=OS_F64) then
  4708. begin
  4709. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,tregister(longint(reg2)+1),tregister(longint(reg1)+1)), PF_F32));
  4710. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32));
  4711. end
  4712. else if (fromsize=OS_F32) and
  4713. (tosize=OS_F64) then
  4714. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VCVT,reg2,reg1), PF_F32))
  4715. begin
  4716. //list.concat(nil);
  4717. end;
  4718. end;
  4719. procedure tthumb2cgarm.a_loadmm_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  4720. begin
  4721. handle_load_store(list,A_VLDR,PF_None,reg,ref);
  4722. end;
  4723. procedure tthumb2cgarm.a_loadmm_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  4724. begin
  4725. handle_load_store(list,A_VSTR,PF_None,reg,ref);
  4726. end;
  4727. procedure tthumb2cgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize: tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  4728. begin
  4729. if //(shuffle=nil) and
  4730. (tosize=OS_F32) then
  4731. list.Concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg))
  4732. else
  4733. internalerror(2012100813);
  4734. end;
  4735. procedure tthumb2cgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize: tcgsize; mmreg, intreg: tregister; shuffle: pmmshuffle);
  4736. begin
  4737. if //(shuffle=nil) and
  4738. (fromsize=OS_F32) then
  4739. list.Concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg))
  4740. else
  4741. internalerror(2012100814);
  4742. end;
  4743. procedure tthumb2cg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  4744. var tmpreg: tregister;
  4745. begin
  4746. case op of
  4747. OP_NEG:
  4748. begin
  4749. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4750. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  4751. tmpreg:=cg.getintregister(list,OS_32);
  4752. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,0));
  4753. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,tmpreg,regsrc.reghi));
  4754. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4755. end;
  4756. else
  4757. inherited a_op64_reg_reg(list, op, size, regsrc, regdst);
  4758. end;
  4759. end;
  4760. procedure tthumbcg64farm.a_op64_reg_reg(list: TAsmList; op: TOpCG; size: tcgsize; regsrc, regdst: tregister64);
  4761. begin
  4762. case op of
  4763. OP_NEG:
  4764. begin
  4765. list.concat(taicpu.op_reg_const(A_MOV,regdst.reglo,0));
  4766. list.concat(taicpu.op_reg_const(A_MOV,regdst.reghi,0));
  4767. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4768. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4769. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4770. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4771. end;
  4772. OP_NOT:
  4773. begin
  4774. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  4775. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  4776. end;
  4777. OP_AND,OP_OR,OP_XOR:
  4778. begin
  4779. cg.a_op_reg_reg(list,op,OS_32,regsrc.reglo,regdst.reglo);
  4780. cg.a_op_reg_reg(list,op,OS_32,regsrc.reghi,regdst.reghi);
  4781. end;
  4782. OP_ADD:
  4783. begin
  4784. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4785. list.concat(taicpu.op_reg_reg(A_ADD,regdst.reglo,regsrc.reglo));
  4786. list.concat(taicpu.op_reg_reg(A_ADC,regdst.reghi,regsrc.reghi));
  4787. end;
  4788. OP_SUB:
  4789. begin
  4790. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4791. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4792. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4793. end;
  4794. else
  4795. internalerror(2003083101);
  4796. end;
  4797. end;
  4798. procedure tthumbcg64farm.a_op64_const_reg(list: TAsmList; op: TOpCG; size: tcgsize; value: int64; reg: tregister64);
  4799. var
  4800. tmpreg : tregister;
  4801. begin
  4802. case op of
  4803. OP_AND,OP_OR,OP_XOR:
  4804. begin
  4805. cg.a_op_const_reg(list,op,OS_32,aint(lo(value)),reg.reglo);
  4806. cg.a_op_const_reg(list,op,OS_32,aint(hi(value)),reg.reghi);
  4807. end;
  4808. OP_ADD:
  4809. begin
  4810. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4811. begin
  4812. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4813. list.concat(taicpu.op_reg_const(A_ADD,reg.reglo,aint(lo(value))));
  4814. end
  4815. else
  4816. begin
  4817. tmpreg:=cg.getintregister(list,OS_32);
  4818. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4819. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4820. list.concat(taicpu.op_reg_reg(A_ADD,reg.reglo,tmpreg));
  4821. end;
  4822. tmpreg:=cg.getintregister(list,OS_32);
  4823. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  4824. list.concat(taicpu.op_reg_reg(A_ADC,reg.reghi,tmpreg));
  4825. end;
  4826. OP_SUB:
  4827. begin
  4828. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4829. begin
  4830. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4831. list.concat(taicpu.op_reg_const(A_SUB,reg.reglo,aint(lo(value))))
  4832. end
  4833. else
  4834. begin
  4835. tmpreg:=cg.getintregister(list,OS_32);
  4836. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4837. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4838. list.concat(taicpu.op_reg_reg(A_SUB,reg.reglo,tmpreg));
  4839. end;
  4840. tmpreg:=cg.getintregister(list,OS_32);
  4841. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  4842. list.concat(taicpu.op_reg_reg(A_SBC,reg.reghi,tmpreg));
  4843. end;
  4844. else
  4845. internalerror(2003083101);
  4846. end;
  4847. end;
  4848. procedure create_codegen;
  4849. begin
  4850. if GenerateThumb2Code then
  4851. begin
  4852. cg:=tthumb2cgarm.create;
  4853. cg64:=tthumb2cg64farm.create;
  4854. casmoptimizer:=TCpuThumb2AsmOptimizer;
  4855. end
  4856. else if GenerateThumbCode then
  4857. begin
  4858. cg:=tthumbcgarm.create;
  4859. cg64:=tthumbcg64farm.create;
  4860. // casmoptimizer:=TCpuThumbAsmOptimizer;
  4861. end
  4862. else
  4863. begin
  4864. cg:=tarmcgarm.create;
  4865. cg64:=tarmcg64farm.create;
  4866. casmoptimizer:=TCpuAsmOptimizer;
  4867. end;
  4868. end;
  4869. end.