cgcpu.pas 214 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762277227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382238323842385238623872388238923902391239223932394239523962397239823992400240124022403240424052406240724082409241024112412241324142415241624172418241924202421242224232424242524262427242824292430243124322433243424352436243724382439244024412442244324442445244624472448244924502451245224532454245524562457245824592460246124622463246424652466246724682469247024712472247324742475247624772478247924802481248224832484248524862487248824892490249124922493249424952496249724982499250025012502250325042505250625072508250925102511251225132514251525162517251825192520252125222523252425252526252725282529253025312532253325342535253625372538253925402541254225432544254525462547254825492550255125522553255425552556255725582559256025612562256325642565256625672568256925702571257225732574257525762577257825792580258125822583258425852586258725882589259025912592259325942595259625972598259926002601260226032604260526062607260826092610261126122613261426152616261726182619262026212622262326242625262626272628262926302631263226332634263526362637263826392640264126422643264426452646264726482649265026512652265326542655265626572658265926602661266226632664266526662667266826692670267126722673267426752676267726782679268026812682268326842685268626872688268926902691269226932694269526962697269826992700270127022703270427052706270727082709271027112712271327142715271627172718271927202721272227232724272527262727272827292730273127322733273427352736273727382739274027412742274327442745274627472748274927502751275227532754275527562757275827592760276127622763276427652766276727682769277027712772277327742775277627772778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327732783279328032813282328332843285328632873288328932903291329232933294329532963297329832993300330133023303330433053306330733083309331033113312331333143315331633173318331933203321332233233324332533263327332833293330333133323333333433353336333733383339334033413342334333443345334633473348334933503351335233533354335533563357335833593360336133623363336433653366336733683369337033713372337333743375337633773378337933803381338233833384338533863387338833893390339133923393339433953396339733983399340034013402340334043405340634073408340934103411341234133414341534163417341834193420342134223423342434253426342734283429343034313432343334343435343634373438343934403441344234433444344534463447344834493450345134523453345434553456345734583459346034613462346334643465346634673468346934703471347234733474347534763477347834793480348134823483348434853486348734883489349034913492349334943495349634973498349935003501350235033504350535063507350835093510351135123513351435153516351735183519352035213522352335243525352635273528352935303531353235333534353535363537353835393540354135423543354435453546354735483549355035513552355335543555355635573558355935603561356235633564356535663567356835693570357135723573357435753576357735783579358035813582358335843585358635873588358935903591359235933594359535963597359835993600360136023603360436053606360736083609361036113612361336143615361636173618361936203621362236233624362536263627362836293630363136323633363436353636363736383639364036413642364336443645364636473648364936503651365236533654365536563657365836593660366136623663366436653666366736683669367036713672367336743675367636773678367936803681368236833684368536863687368836893690369136923693369436953696369736983699370037013702370337043705370637073708370937103711371237133714371537163717371837193720372137223723372437253726372737283729373037313732373337343735373637373738373937403741374237433744374537463747374837493750375137523753375437553756375737583759376037613762376337643765376637673768376937703771377237733774377537763777377837793780378137823783378437853786378737883789379037913792379337943795379637973798379938003801380238033804380538063807380838093810381138123813381438153816381738183819382038213822382338243825382638273828382938303831383238333834383538363837383838393840384138423843384438453846384738483849385038513852385338543855385638573858385938603861386238633864386538663867386838693870387138723873387438753876387738783879388038813882388338843885388638873888388938903891389238933894389538963897389838993900390139023903390439053906390739083909391039113912391339143915391639173918391939203921392239233924392539263927392839293930393139323933393439353936393739383939394039413942394339443945394639473948394939503951395239533954395539563957395839593960396139623963396439653966396739683969397039713972397339743975397639773978397939803981398239833984398539863987398839893990399139923993399439953996399739983999400040014002400340044005400640074008400940104011401240134014401540164017401840194020402140224023402440254026402740284029403040314032403340344035403640374038403940404041404240434044404540464047404840494050405140524053405440554056405740584059406040614062406340644065406640674068406940704071407240734074407540764077407840794080408140824083408440854086408740884089409040914092409340944095409640974098409941004101410241034104410541064107410841094110411141124113411441154116411741184119412041214122412341244125412641274128412941304131413241334134413541364137413841394140414141424143414441454146414741484149415041514152415341544155415641574158415941604161416241634164416541664167416841694170417141724173417441754176417741784179418041814182418341844185418641874188418941904191419241934194419541964197419841994200420142024203420442054206420742084209421042114212421342144215421642174218421942204221422242234224422542264227422842294230423142324233423442354236423742384239424042414242424342444245424642474248424942504251425242534254425542564257425842594260426142624263426442654266426742684269427042714272427342744275427642774278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477747784779478047814782478347844785478647874788478947904791479247934794479547964797479847994800480148024803480448054806480748084809481048114812481348144815481648174818481948204821482248234824482548264827482848294830483148324833483448354836483748384839484048414842484348444845484648474848484948504851485248534854485548564857485848594860486148624863486448654866486748684869487048714872487348744875487648774878487948804881488248834884488548864887488848894890489148924893489448954896489748984899490049014902490349044905490649074908490949104911491249134914491549164917491849194920492149224923492449254926492749284929493049314932493349344935493649374938493949404941494249434944494549464947494849494950495149524953495449554956495749584959496049614962496349644965496649674968496949704971497249734974497549764977497849794980498149824983498449854986498749884989499049914992499349944995499649974998499950005001500250035004500550065007500850095010501150125013501450155016501750185019502050215022502350245025502650275028502950305031503250335034503550365037503850395040504150425043504450455046504750485049505050515052505350545055505650575058505950605061506250635064506550665067506850695070507150725073507450755076507750785079508050815082508350845085508650875088508950905091509250935094509550965097509850995100510151025103510451055106510751085109511051115112511351145115511651175118511951205121512251235124512551265127512851295130513151325133513451355136513751385139514051415142514351445145514651475148514951505151515251535154515551565157515851595160516151625163516451655166516751685169517051715172517351745175517651775178517951805181518251835184518551865187518851895190519151925193519451955196519751985199520052015202520352045205520652075208520952105211521252135214521552165217521852195220522152225223522452255226522752285229523052315232523352345235523652375238523952405241524252435244524552465247524852495250525152525253525452555256525752585259526052615262526352645265526652675268526952705271527252735274527552765277527852795280528152825283528452855286528752885289529052915292529352945295529652975298529953005301530253035304530553065307530853095310531153125313531453155316531753185319532053215322532353245325532653275328
  1. {
  2. Copyright (c) 2003 by Florian Klaempfl
  3. Member of the Free Pascal development team
  4. This unit implements the code generator for the ARM
  5. This program is free software; you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation; either version 2 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program; if not, write to the Free Software
  15. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  16. ****************************************************************************
  17. }
  18. unit cgcpu;
  19. {$i fpcdefs.inc}
  20. interface
  21. uses
  22. globtype,symtype,symdef,
  23. cgbase,cgutils,cgobj,
  24. aasmbase,aasmcpu,aasmtai,aasmdata,
  25. parabase,
  26. cpubase,cpuinfo,cg64f32,rgcpu;
  27. type
  28. { tbasecgarm is shared between all arm architectures }
  29. tbasecgarm = class(tcg)
  30. { true, if the next arithmetic operation should modify the flags }
  31. cgsetflags : boolean;
  32. procedure a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);override;
  33. procedure a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);override;
  34. procedure a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);override;
  35. procedure a_call_name(list : TAsmList;const s : string; weak: boolean);override;
  36. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  37. { move instructions }
  38. procedure a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);override;
  39. procedure a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);override;
  40. function a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  41. function a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  42. { fpu move instructions }
  43. procedure a_loadfpu_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister); override;
  44. procedure a_loadfpu_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister); override;
  45. procedure a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference); override;
  46. procedure a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);override;
  47. { comparison operations }
  48. procedure a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  49. l : tasmlabel);override;
  50. procedure a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel); override;
  51. procedure a_jmp_name(list : TAsmList;const s : string); override;
  52. procedure a_jmp_always(list : TAsmList;l: tasmlabel); override;
  53. procedure a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel); override;
  54. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  55. procedure g_profilecode(list : TAsmList); override;
  56. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  57. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  58. procedure g_maybe_got_init(list : TAsmList); override;
  59. procedure a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);override;
  60. procedure g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);override;
  61. procedure g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);override;
  62. procedure g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  63. procedure g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  64. procedure g_overflowcheck(list: TAsmList; const l: tlocation; def: tdef); override;
  65. procedure g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);override;
  66. procedure g_save_registers(list : TAsmList);override;
  67. procedure g_restore_registers(list : TAsmList);override;
  68. procedure a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  69. procedure fixref(list : TAsmList;var ref : treference);
  70. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; virtual;
  71. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  72. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  73. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  74. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  75. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  76. procedure a_opmm_reg_reg(list: TAsmList; Op: TOpCG; size : tcgsize;src,dst: tregister;shuffle : pmmshuffle); override;
  77. { Transform unsupported methods into Internal errors }
  78. procedure a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister); override;
  79. { try to generate optimized 32 Bit multiplication, returns true if successful generated }
  80. function try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  81. { clear out potential overflow bits from 8 or 16 bit operations }
  82. { the upper 24/16 bits of a register after an operation }
  83. procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  84. { mla for thumb requires that none of the registers is equal to r13/r15, this method ensures this }
  85. procedure safe_mla(list: TAsmList;op1,op2,op3,op4 : TRegister);
  86. end;
  87. { tcgarm is shared between normal arm and thumb-2 }
  88. tcgarm = class(tbasecgarm)
  89. procedure a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister); override;
  90. procedure a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference); override;
  91. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  92. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  93. size: tcgsize; a: tcgint; src, dst: tregister); override;
  94. procedure a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  95. size: tcgsize; src1, src2, dst: tregister); override;
  96. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  97. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  98. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  99. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  100. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  101. {Multiply two 32-bit registers into lo and hi 32-bit registers}
  102. procedure a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister); override;
  103. end;
  104. { normal arm cg }
  105. tarmcgarm = class(tcgarm)
  106. procedure init_register_allocators;override;
  107. procedure done_register_allocators;override;
  108. end;
  109. { 64 bit cg for all arm flavours }
  110. tbasecg64farm = class(tcg64f32)
  111. end;
  112. { tcg64farm is shared between normal arm and thumb-2 }
  113. tcg64farm = class(tbasecg64farm)
  114. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  115. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  116. procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;
  117. procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
  118. procedure a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  119. procedure a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  120. procedure a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);override;
  121. procedure a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);override;
  122. end;
  123. tarmcg64farm = class(tcg64farm)
  124. end;
  125. tthumbcgarm = class(tbasecgarm)
  126. procedure init_register_allocators;override;
  127. procedure done_register_allocators;override;
  128. procedure g_proc_entry(list: TAsmList; localsize: longint; nostackframe: boolean);override;
  129. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  130. procedure a_op_reg_reg(list: TAsmList; Op: TOpCG; size: TCGSize; src,dst: TRegister);override;
  131. procedure a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);override;
  132. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister); override;
  133. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  134. procedure a_load_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const Ref: treference; reg: tregister);override;
  135. procedure a_load_const_reg(list: TAsmList; size: tcgsize; a: tcgint; reg: tregister);override;
  136. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  137. function handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference; override;
  138. end;
  139. tthumbcg64farm = class(tbasecg64farm)
  140. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  141. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  142. end;
  143. tthumb2cgarm = class(tcgarm)
  144. procedure init_register_allocators;override;
  145. procedure done_register_allocators;override;
  146. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  147. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  148. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  149. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  150. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  151. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  152. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  153. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  154. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  155. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; override;
  156. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  157. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  158. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  159. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  160. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  161. end;
  162. tthumb2cg64farm = class(tcg64farm)
  163. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  164. end;
  165. const
  166. OpCmp2AsmCond : Array[topcmp] of TAsmCond = (C_NONE,C_EQ,C_GT,
  167. C_LT,C_GE,C_LE,C_NE,C_LS,C_CC,C_CS,C_HI);
  168. winstackpagesize = 4096;
  169. function get_fpu_postfix(def : tdef) : toppostfix;
  170. procedure create_codegen;
  171. implementation
  172. uses
  173. globals,verbose,systems,cutils,
  174. aopt,aoptcpu,
  175. fmodule,
  176. symconst,symsym,symtable,
  177. tgobj,
  178. procinfo,cpupi,
  179. paramgr;
  180. function get_fpu_postfix(def : tdef) : toppostfix;
  181. begin
  182. if def.typ=floatdef then
  183. begin
  184. case tfloatdef(def).floattype of
  185. s32real:
  186. result:=PF_S;
  187. s64real:
  188. result:=PF_D;
  189. s80real:
  190. result:=PF_E;
  191. else
  192. internalerror(200401272);
  193. end;
  194. end
  195. else
  196. internalerror(200401271);
  197. end;
  198. procedure tarmcgarm.init_register_allocators;
  199. begin
  200. inherited init_register_allocators;
  201. { currently, we always save R14, so we can use it }
  202. if (target_info.system<>system_arm_darwin) then
  203. begin
  204. if assigned(current_procinfo) and (current_procinfo.framepointer<>NR_R11) then
  205. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  206. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  207. RS_R9,RS_R10,RS_R11,RS_R14],first_int_imreg,[])
  208. else
  209. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  210. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  211. RS_R9,RS_R10,RS_R14],first_int_imreg,[])
  212. end
  213. else
  214. { r7 is not available on Darwin, it's used as frame pointer (always,
  215. for backtrace support -- also in gcc/clang -> R11 can be used).
  216. r9 is volatile }
  217. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  218. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R9,RS_R12,RS_R4,RS_R5,RS_R6,RS_R8,
  219. RS_R10,RS_R11,RS_R14],first_int_imreg,[]);
  220. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  221. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  222. { The register allocator currently cannot deal with multiple
  223. non-overlapping subregs per register, so we can only use
  224. half the single precision registers for now (as sub registers of the
  225. double precision ones). }
  226. if current_settings.fputype in [fpu_vfpv3,fpu_vfpv4] then
  227. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  228. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  229. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  230. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  231. ],first_mm_imreg,[])
  232. else
  233. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  234. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15],first_mm_imreg,[]);
  235. end;
  236. procedure tarmcgarm.done_register_allocators;
  237. begin
  238. rg[R_INTREGISTER].free;
  239. rg[R_FPUREGISTER].free;
  240. rg[R_MMREGISTER].free;
  241. inherited done_register_allocators;
  242. end;
  243. procedure tcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  244. var
  245. imm_shift : byte;
  246. l : tasmlabel;
  247. hr : treference;
  248. imm1, imm2: DWord;
  249. begin
  250. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  251. internalerror(2002090902);
  252. if is_shifter_const(a,imm_shift) then
  253. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  254. else if is_shifter_const(not(a),imm_shift) then
  255. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  256. { loading of constants with mov and orr }
  257. else if (split_into_shifter_const(a,imm1, imm2)) then
  258. begin
  259. list.concat(taicpu.op_reg_const(A_MOV,reg, imm1));
  260. list.concat(taicpu.op_reg_reg_const(A_ORR,reg,reg, imm2));
  261. end
  262. { loading of constants with mvn and bic }
  263. else if (split_into_shifter_const(not(a), imm1, imm2)) then
  264. begin
  265. list.concat(taicpu.op_reg_const(A_MVN,reg, imm1));
  266. list.concat(taicpu.op_reg_reg_const(A_BIC,reg,reg, imm2));
  267. end
  268. else
  269. begin
  270. reference_reset(hr,4,[]);
  271. current_asmdata.getjumplabel(l);
  272. cg.a_label(current_procinfo.aktlocaldata,l);
  273. hr.symboldata:=current_procinfo.aktlocaldata.last;
  274. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  275. hr.symbol:=l;
  276. hr.base:=NR_PC;
  277. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  278. end;
  279. end;
  280. procedure tcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  281. var
  282. oppostfix:toppostfix;
  283. usedtmpref: treference;
  284. tmpreg,tmpreg2 : tregister;
  285. so : tshifterop;
  286. dir : integer;
  287. begin
  288. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  289. FromSize := ToSize;
  290. case FromSize of
  291. { signed integer registers }
  292. OS_8:
  293. oppostfix:=PF_B;
  294. OS_S8:
  295. oppostfix:=PF_SB;
  296. OS_16:
  297. oppostfix:=PF_H;
  298. OS_S16:
  299. oppostfix:=PF_SH;
  300. OS_32,
  301. OS_S32:
  302. oppostfix:=PF_None;
  303. else
  304. InternalError(200308297);
  305. end;
  306. if (fromsize=OS_S8) and
  307. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  308. oppostfix:=PF_B;
  309. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize])) or
  310. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  311. (oppostfix in [PF_SH,PF_H])) then
  312. begin
  313. if target_info.endian=endian_big then
  314. dir:=-1
  315. else
  316. dir:=1;
  317. case FromSize of
  318. OS_16,OS_S16:
  319. begin
  320. { only complicated references need an extra loadaddr }
  321. if assigned(ref.symbol) or
  322. (ref.index<>NR_NO) or
  323. (ref.offset<-4095) or
  324. (ref.offset>4094) or
  325. { sometimes the compiler reused registers }
  326. (reg=ref.index) or
  327. (reg=ref.base) then
  328. begin
  329. tmpreg2:=getintregister(list,OS_INT);
  330. a_loadaddr_ref_reg(list,ref,tmpreg2);
  331. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment,ref.volatility);
  332. end
  333. else
  334. usedtmpref:=ref;
  335. if target_info.endian=endian_big then
  336. inc(usedtmpref.offset,1);
  337. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  338. tmpreg:=getintregister(list,OS_INT);
  339. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  340. inc(usedtmpref.offset,dir);
  341. if FromSize=OS_16 then
  342. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  343. else
  344. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  345. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  346. end;
  347. OS_32,OS_S32:
  348. begin
  349. tmpreg:=getintregister(list,OS_INT);
  350. { only complicated references need an extra loadaddr }
  351. if assigned(ref.symbol) or
  352. (ref.index<>NR_NO) or
  353. (ref.offset<-4095) or
  354. (ref.offset>4092) or
  355. { sometimes the compiler reused registers }
  356. (reg=ref.index) or
  357. (reg=ref.base) then
  358. begin
  359. tmpreg2:=getintregister(list,OS_INT);
  360. a_loadaddr_ref_reg(list,ref,tmpreg2);
  361. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment,ref.volatility);
  362. end
  363. else
  364. usedtmpref:=ref;
  365. shifterop_reset(so);so.shiftmode:=SM_LSL;
  366. if ref.alignment=2 then
  367. begin
  368. if target_info.endian=endian_big then
  369. inc(usedtmpref.offset,2);
  370. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  371. inc(usedtmpref.offset,dir*2);
  372. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  373. so.shiftimm:=16;
  374. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  375. end
  376. else
  377. begin
  378. tmpreg2:=getintregister(list,OS_INT);
  379. if target_info.endian=endian_big then
  380. inc(usedtmpref.offset,3);
  381. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  382. inc(usedtmpref.offset,dir);
  383. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  384. inc(usedtmpref.offset,dir);
  385. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg2);
  386. so.shiftimm:=8;
  387. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  388. inc(usedtmpref.offset,dir);
  389. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  390. so.shiftimm:=16;
  391. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg2,so));
  392. so.shiftimm:=24;
  393. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  394. end;
  395. end
  396. else
  397. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  398. end;
  399. end
  400. else
  401. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  402. if (fromsize=OS_S8) and
  403. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  404. a_load_reg_reg(list,OS_S8,OS_32,reg,reg)
  405. else if (fromsize=OS_S8) and (tosize = OS_16) then
  406. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  407. end;
  408. procedure tcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  409. var
  410. hsym : tsym;
  411. href : treference;
  412. paraloc : Pcgparalocation;
  413. shift : byte;
  414. begin
  415. { calculate the parameter info for the procdef }
  416. procdef.init_paraloc_info(callerside);
  417. hsym:=tsym(procdef.parast.Find('self'));
  418. if not(assigned(hsym) and
  419. (hsym.typ=paravarsym)) then
  420. internalerror(200305251);
  421. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  422. while paraloc<>nil do
  423. with paraloc^ do
  424. begin
  425. case loc of
  426. LOC_REGISTER:
  427. begin
  428. if is_shifter_const(ioffset,shift) then
  429. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  430. else
  431. begin
  432. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  433. a_op_reg_reg(list,OP_SUB,size,NR_R12,register);
  434. end;
  435. end;
  436. LOC_REFERENCE:
  437. begin
  438. { offset in the wrapper needs to be adjusted for the stored
  439. return address }
  440. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),sizeof(pint),[]);
  441. if is_shifter_const(ioffset,shift) then
  442. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  443. else
  444. begin
  445. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  446. a_op_reg_ref(list,OP_SUB,size,NR_R12,href);
  447. end;
  448. end
  449. else
  450. internalerror(200309189);
  451. end;
  452. paraloc:=next;
  453. end;
  454. end;
  455. procedure tbasecgarm.a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);
  456. var
  457. ref: treference;
  458. begin
  459. paraloc.check_simple_location;
  460. paramanager.allocparaloc(list,paraloc.location);
  461. case paraloc.location^.loc of
  462. LOC_REGISTER,LOC_CREGISTER:
  463. a_load_const_reg(list,size,a,paraloc.location^.register);
  464. LOC_REFERENCE:
  465. begin
  466. reference_reset(ref,paraloc.alignment,[]);
  467. ref.base:=paraloc.location^.reference.index;
  468. ref.offset:=paraloc.location^.reference.offset;
  469. a_load_const_ref(list,size,a,ref);
  470. end;
  471. else
  472. internalerror(2002081101);
  473. end;
  474. end;
  475. procedure tbasecgarm.a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);
  476. var
  477. tmpref, ref: treference;
  478. location: pcgparalocation;
  479. sizeleft: aint;
  480. begin
  481. location := paraloc.location;
  482. tmpref := r;
  483. sizeleft := paraloc.intsize;
  484. while assigned(location) do
  485. begin
  486. paramanager.allocparaloc(list,location);
  487. case location^.loc of
  488. LOC_REGISTER,LOC_CREGISTER:
  489. a_load_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  490. LOC_REFERENCE:
  491. begin
  492. reference_reset_base(ref,location^.reference.index,location^.reference.offset,paraloc.alignment,[]);
  493. { doubles in softemu mode have a strange order of registers and references }
  494. if location^.size=OS_32 then
  495. g_concatcopy(list,tmpref,ref,4)
  496. else
  497. begin
  498. g_concatcopy(list,tmpref,ref,sizeleft);
  499. if assigned(location^.next) then
  500. internalerror(2005010710);
  501. end;
  502. end;
  503. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  504. case location^.size of
  505. OS_F32, OS_F64:
  506. a_loadfpu_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  507. else
  508. internalerror(2002072801);
  509. end;
  510. LOC_VOID:
  511. begin
  512. // nothing to do
  513. end;
  514. else
  515. internalerror(2002081103);
  516. end;
  517. inc(tmpref.offset,tcgsize2size[location^.size]);
  518. dec(sizeleft,tcgsize2size[location^.size]);
  519. location := location^.next;
  520. end;
  521. end;
  522. procedure tbasecgarm.a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);
  523. var
  524. ref: treference;
  525. tmpreg: tregister;
  526. begin
  527. paraloc.check_simple_location;
  528. paramanager.allocparaloc(list,paraloc.location);
  529. case paraloc.location^.loc of
  530. LOC_REGISTER,LOC_CREGISTER:
  531. a_loadaddr_ref_reg(list,r,paraloc.location^.register);
  532. LOC_REFERENCE:
  533. begin
  534. reference_reset(ref,paraloc.alignment,[]);
  535. ref.base := paraloc.location^.reference.index;
  536. ref.offset := paraloc.location^.reference.offset;
  537. tmpreg := getintregister(list,OS_ADDR);
  538. a_loadaddr_ref_reg(list,r,tmpreg);
  539. a_load_reg_ref(list,OS_ADDR,OS_ADDR,tmpreg,ref);
  540. end;
  541. else
  542. internalerror(2002080701);
  543. end;
  544. end;
  545. procedure tbasecgarm.a_call_name(list : TAsmList;const s : string; weak: boolean);
  546. var
  547. branchopcode: tasmop;
  548. r : treference;
  549. sym : TAsmSymbol;
  550. begin
  551. { check not really correct: should only be used for non-Thumb cpus }
  552. // if (CPUARM_HAS_BLX_LABEL in cpu_capabilities[current_settings.cputype]) and
  553. // { WinCE GNU AS (not sure if this applies in general) does not support BLX imm }
  554. // (target_info.system<>system_arm_wince) then
  555. // branchopcode:=A_BLX
  556. // else
  557. { use always BL as newer binutils do not translate blx apparently
  558. generating BL is also what clang and gcc do by default }
  559. branchopcode:=A_BL;
  560. if not(weak) then
  561. sym:=current_asmdata.RefAsmSymbol(s,AT_FUNCTION)
  562. else
  563. sym:=current_asmdata.WeakRefAsmSymbol(s,AT_FUNCTION);
  564. reference_reset_symbol(r,sym,0,sizeof(pint),[]);
  565. if (tf_pic_uses_got in target_info.flags) and
  566. (cs_create_pic in current_settings.moduleswitches) then
  567. begin
  568. r.refaddr:=addr_pic
  569. end
  570. else
  571. r.refaddr:=addr_full;
  572. list.concat(taicpu.op_ref(branchopcode,r));
  573. {
  574. the compiler does not properly set this flag anymore in pass 1, and
  575. for now we only need it after pass 2 (I hope) (JM)
  576. if not(pi_do_call in current_procinfo.flags) then
  577. internalerror(2003060703);
  578. }
  579. include(current_procinfo.flags,pi_do_call);
  580. end;
  581. procedure tbasecgarm.a_call_reg(list : TAsmList;reg: tregister);
  582. begin
  583. { check not really correct: should only be used for non-Thumb cpus }
  584. if not(CPUARM_HAS_BLX in cpu_capabilities[current_settings.cputype]) then
  585. begin
  586. list.concat(taicpu.op_reg_reg(A_MOV,NR_R14,NR_PC));
  587. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,reg));
  588. end
  589. else
  590. list.concat(taicpu.op_reg(A_BLX, reg));
  591. {
  592. the compiler does not properly set this flag anymore in pass 1, and
  593. for now we only need it after pass 2 (I hope) (JM)
  594. if not(pi_do_call in current_procinfo.flags) then
  595. internalerror(2003060703);
  596. }
  597. include(current_procinfo.flags,pi_do_call);
  598. end;
  599. procedure tcgarm.a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister);
  600. begin
  601. a_op_const_reg_reg(list,op,size,a,reg,reg);
  602. end;
  603. procedure tcgarm.a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference);
  604. var
  605. tmpreg,tmpresreg : tregister;
  606. tmpref : treference;
  607. begin
  608. tmpreg:=getintregister(list,size);
  609. tmpresreg:=getintregister(list,size);
  610. tmpref:=a_internal_load_ref_reg(list,size,size,ref,tmpreg);
  611. a_op_const_reg_reg(list,op,size,a,tmpreg,tmpresreg);
  612. a_load_reg_ref(list,size,size,tmpresreg,tmpref);
  613. end;
  614. procedure tcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  615. var
  616. so : tshifterop;
  617. begin
  618. if op = OP_NEG then
  619. begin
  620. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,src,0));
  621. maybeadjustresult(list,OP_NEG,size,dst);
  622. end
  623. else if op = OP_NOT then
  624. begin
  625. if size in [OS_8, OS_16, OS_S8, OS_S16] then
  626. begin
  627. shifterop_reset(so);
  628. so.shiftmode:=SM_LSL;
  629. if size in [OS_8, OS_S8] then
  630. so.shiftimm:=24
  631. else
  632. so.shiftimm:=16;
  633. list.concat(taicpu.op_reg_reg_shifterop(A_MVN,dst,src,so));
  634. {Using a shift here allows this to be folded into another instruction}
  635. if size in [OS_S8, OS_S16] then
  636. so.shiftmode:=SM_ASR
  637. else
  638. so.shiftmode:=SM_LSR;
  639. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  640. end
  641. else
  642. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  643. end
  644. else
  645. a_op_reg_reg_reg(list,op,size,src,dst,dst);
  646. end;
  647. const
  648. op_reg_reg_opcg2asmop: array[TOpCG] of tasmop =
  649. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  650. A_NONE,A_NONE,A_NONE,A_SUB,A_EOR,A_NONE,A_NONE);
  651. op_reg_opcg2asmop: array[TOpCG] of tasmop =
  652. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  653. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  654. op_reg_postfix: array[TOpCG] of TOpPostfix =
  655. (PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,
  656. PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None);
  657. procedure tcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  658. size: tcgsize; a: tcgint; src, dst: tregister);
  659. var
  660. ovloc : tlocation;
  661. begin
  662. a_op_const_reg_reg_checkoverflow(list,op,size,a,src,dst,false,ovloc);
  663. end;
  664. procedure tcgarm.a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  665. size: tcgsize; src1, src2, dst: tregister);
  666. var
  667. ovloc : tlocation;
  668. begin
  669. a_op_reg_reg_reg_checkoverflow(list,op,size,src1,src2,dst,false,ovloc);
  670. end;
  671. function opshift2shiftmode(op: TOpCg): tshiftmode;
  672. begin
  673. case op of
  674. OP_SHL: Result:=SM_LSL;
  675. OP_SHR: Result:=SM_LSR;
  676. OP_ROR: Result:=SM_ROR;
  677. OP_ROL: Result:=SM_ROR;
  678. OP_SAR: Result:=SM_ASR;
  679. else internalerror(2012070501);
  680. end
  681. end;
  682. function tbasecgarm.try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  683. var
  684. multiplier : dword;
  685. power : longint;
  686. shifterop : tshifterop;
  687. bitsset : byte;
  688. negative : boolean;
  689. first : boolean;
  690. b,
  691. cycles : byte;
  692. maxeffort : byte;
  693. begin
  694. result:=true;
  695. cycles:=0;
  696. negative:=a<0;
  697. shifterop.rs:=NR_NO;
  698. shifterop.shiftmode:=SM_LSL;
  699. if negative then
  700. inc(cycles);
  701. multiplier:=dword(abs(a));
  702. bitsset:=popcnt(multiplier and $fffffffe);
  703. { heuristics to estimate how much instructions are reasonable to replace the mul,
  704. this is currently based on XScale timings }
  705. { in the simplest case, we need a mov to load the constant and a mul to carry out the
  706. actual multiplication, this requires min. 1+4 cycles
  707. because the first shift imm. might cause a stall and because we need more instructions
  708. when replacing the mul we generate max. 3 instructions to replace this mul }
  709. maxeffort:=3;
  710. { if the constant is not a shifter op, we need either some mov/mvn/bic/or sequence or
  711. a ldr, so generating one more operation to replace this is beneficial }
  712. if not(is_shifter_const(dword(a),b)) and not(is_shifter_const(not(dword(a)),b)) then
  713. inc(maxeffort);
  714. { if the upper 5 bits are all set or clear, mul is one cycle faster }
  715. if ((dword(a) and $f8000000)=0) or ((dword(a) and $f8000000)=$f8000000) then
  716. dec(maxeffort);
  717. { if the upper 17 bits are all set or clear, mul is another cycle faster }
  718. if ((dword(a) and $ffff8000)=0) or ((dword(a) and $ffff8000)=$ffff8000) then
  719. dec(maxeffort);
  720. { most simple cases }
  721. if a=1 then
  722. a_load_reg_reg(list,OS_32,OS_32,src,dst)
  723. else if a=0 then
  724. a_load_const_reg(list,OS_32,0,dst)
  725. else if a=-1 then
  726. a_op_reg_reg(list,OP_NEG,OS_32,src,dst)
  727. { add up ?
  728. basically, one add is needed for each bit being set in the constant factor
  729. however, the least significant bit is for free, it can be hidden in the initial
  730. instruction
  731. }
  732. else if (bitsset+cycles<=maxeffort) and
  733. (bitsset<=popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)) then
  734. begin
  735. first:=true;
  736. while multiplier<>0 do
  737. begin
  738. shifterop.shiftimm:=BsrDWord(multiplier);
  739. if odd(multiplier) then
  740. begin
  741. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,shifterop));
  742. dec(multiplier);
  743. end
  744. else
  745. if first then
  746. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  747. else
  748. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,src,shifterop));
  749. first:=false;
  750. dec(multiplier,1 shl shifterop.shiftimm);
  751. end;
  752. if negative then
  753. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  754. end
  755. { subtract from the next greater power of two? }
  756. else if popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)+cycles+1<=maxeffort then
  757. begin
  758. first:=true;
  759. while multiplier<>0 do
  760. begin
  761. if first then
  762. begin
  763. multiplier:=(1 shl power)-multiplier;
  764. shifterop.shiftimm:=power;
  765. end
  766. else
  767. shifterop.shiftimm:=BsrDWord(multiplier);
  768. if odd(multiplier) then
  769. begin
  770. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,shifterop));
  771. dec(multiplier);
  772. end
  773. else
  774. if first then
  775. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  776. else
  777. begin
  778. list.concat(taicpu.op_reg_reg_reg_shifterop(A_SUB,dst,dst,src,shifterop));
  779. dec(multiplier,1 shl shifterop.shiftimm);
  780. end;
  781. first:=false;
  782. end;
  783. if negative then
  784. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  785. end
  786. else
  787. result:=false;
  788. end;
  789. procedure tcgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  790. var
  791. shift, lsb, width : byte;
  792. tmpreg : tregister;
  793. so : tshifterop;
  794. l1 : longint;
  795. imm1, imm2: DWord;
  796. begin
  797. optimize_op_const(size, op, a);
  798. case op of
  799. OP_NONE:
  800. begin
  801. if src <> dst then
  802. a_load_reg_reg(list, size, size, src, dst);
  803. exit;
  804. end;
  805. OP_MOVE:
  806. begin
  807. a_load_const_reg(list, size, a, dst);
  808. exit;
  809. end;
  810. end;
  811. ovloc.loc:=LOC_VOID;
  812. if {$ifopt R+}(a<>-2147483648) and{$endif} not setflags and is_shifter_const(-a,shift) then
  813. case op of
  814. OP_ADD:
  815. begin
  816. op:=OP_SUB;
  817. a:=aint(dword(-a));
  818. end;
  819. OP_SUB:
  820. begin
  821. op:=OP_ADD;
  822. a:=aint(dword(-a));
  823. end
  824. end;
  825. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  826. case op of
  827. OP_NEG,OP_NOT:
  828. internalerror(200308281);
  829. OP_SHL,
  830. OP_SHR,
  831. OP_ROL,
  832. OP_ROR,
  833. OP_SAR:
  834. begin
  835. if a>32 then
  836. internalerror(200308294);
  837. shifterop_reset(so);
  838. so.shiftmode:=opshift2shiftmode(op);
  839. if op = OP_ROL then
  840. so.shiftimm:=32-a
  841. else
  842. so.shiftimm:=a;
  843. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  844. end;
  845. else
  846. {if (op in [OP_SUB, OP_ADD]) and
  847. ((a < 0) or
  848. (a > 4095)) then
  849. begin
  850. tmpreg:=getintregister(list,size);
  851. list.concat(taicpu.op_reg_const(A_MOVT, tmpreg, (a shr 16) and $FFFF));
  852. list.concat(taicpu.op_reg_const(A_MOV, tmpreg, a and $FFFF));
  853. list.concat(setoppostfix(taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))
  854. ));
  855. end
  856. else}
  857. begin
  858. if cgsetflags or setflags then
  859. a_reg_alloc(list,NR_DEFAULTFLAGS);
  860. list.concat(setoppostfix(
  861. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  862. end;
  863. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  864. begin
  865. ovloc.loc:=LOC_FLAGS;
  866. case op of
  867. OP_ADD:
  868. ovloc.resflags:=F_CS;
  869. OP_SUB:
  870. ovloc.resflags:=F_CC;
  871. end;
  872. end;
  873. end
  874. else
  875. begin
  876. { there could be added some more sophisticated optimizations }
  877. if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  878. a_op_reg_reg(list,OP_NEG,size,src,dst)
  879. { we do this here instead in the peephole optimizer because
  880. it saves us a register }
  881. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  882. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  883. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  884. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  885. begin
  886. if l1>32 then{roozbeh does this ever happen?}
  887. internalerror(200308296);
  888. shifterop_reset(so);
  889. so.shiftmode:=SM_LSL;
  890. so.shiftimm:=l1;
  891. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  892. end
  893. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  894. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  895. begin
  896. if l1>32 then{does this ever happen?}
  897. internalerror(201205181);
  898. shifterop_reset(so);
  899. so.shiftmode:=SM_LSL;
  900. so.shiftimm:=l1;
  901. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  902. end
  903. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  904. begin
  905. { nothing to do on success }
  906. end
  907. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  908. broader range of shifterconstants.}
  909. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  910. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  911. { Doing two shifts instead of two bics might allow the peephole optimizer to fold the second shift
  912. into the following instruction}
  913. else if (op = OP_AND) and
  914. is_continuous_mask(a, lsb, width) and
  915. ((lsb = 0) or ((lsb + width) = 32)) then
  916. begin
  917. shifterop_reset(so);
  918. if (width = 16) and
  919. (lsb = 0) and
  920. (current_settings.cputype >= cpu_armv6) then
  921. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  922. else if (width = 8) and
  923. (lsb = 0) and
  924. (current_settings.cputype >= cpu_armv6) then
  925. list.concat(taicpu.op_reg_reg(A_UXTB,dst,src))
  926. else if lsb = 0 then
  927. begin
  928. so.shiftmode:=SM_LSL;
  929. so.shiftimm:=32-width;
  930. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  931. so.shiftmode:=SM_LSR;
  932. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  933. end
  934. else
  935. begin
  936. so.shiftmode:=SM_LSR;
  937. so.shiftimm:=lsb;
  938. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  939. so.shiftmode:=SM_LSL;
  940. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  941. end;
  942. end
  943. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  944. begin
  945. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,imm1));
  946. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  947. end
  948. else if (op in [OP_ADD, OP_SUB, OP_OR, OP_XOR]) and
  949. not(cgsetflags or setflags) and
  950. split_into_shifter_const(a, imm1, imm2) then
  951. begin
  952. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,imm1));
  953. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  954. end
  955. else
  956. begin
  957. tmpreg:=getintregister(list,size);
  958. a_load_const_reg(list,size,a,tmpreg);
  959. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  960. end;
  961. end;
  962. maybeadjustresult(list,op,size,dst);
  963. end;
  964. procedure tcgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  965. var
  966. so : tshifterop;
  967. tmpreg,overflowreg : tregister;
  968. asmop : tasmop;
  969. begin
  970. ovloc.loc:=LOC_VOID;
  971. case op of
  972. OP_NEG,OP_NOT,
  973. OP_DIV,OP_IDIV:
  974. internalerror(200308283);
  975. OP_SHL,
  976. OP_SHR,
  977. OP_SAR,
  978. OP_ROR:
  979. begin
  980. if (op = OP_ROR) and not(size in [OS_32,OS_S32]) then
  981. internalerror(2008072801);
  982. shifterop_reset(so);
  983. so.rs:=src1;
  984. so.shiftmode:=opshift2shiftmode(op);
  985. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  986. end;
  987. OP_ROL:
  988. begin
  989. if not(size in [OS_32,OS_S32]) then
  990. internalerror(2008072801);
  991. { simulate ROL by ror'ing 32-value }
  992. tmpreg:=getintregister(list,OS_32);
  993. list.concat(taicpu.op_reg_reg_const(A_RSB,tmpreg,src1, 32));
  994. shifterop_reset(so);
  995. so.rs:=tmpreg;
  996. so.shiftmode:=SM_ROR;
  997. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  998. end;
  999. OP_IMUL,
  1000. OP_MUL:
  1001. begin
  1002. if (cgsetflags or setflags) and
  1003. (CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype]) then
  1004. begin
  1005. overflowreg:=getintregister(list,size);
  1006. if op=OP_IMUL then
  1007. asmop:=A_SMULL
  1008. else
  1009. asmop:=A_UMULL;
  1010. { the arm doesn't allow that rd and rm are the same }
  1011. if dst=src2 then
  1012. begin
  1013. if dst<>src1 then
  1014. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  1015. else
  1016. begin
  1017. tmpreg:=getintregister(list,size);
  1018. a_load_reg_reg(list,size,size,src2,dst);
  1019. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  1020. end;
  1021. end
  1022. else
  1023. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  1024. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1025. if op=OP_IMUL then
  1026. begin
  1027. shifterop_reset(so);
  1028. so.shiftmode:=SM_ASR;
  1029. so.shiftimm:=31;
  1030. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  1031. end
  1032. else
  1033. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  1034. ovloc.loc:=LOC_FLAGS;
  1035. ovloc.resflags:=F_NE;
  1036. end
  1037. else
  1038. begin
  1039. { the arm doesn't allow that rd and rm are the same }
  1040. if dst=src2 then
  1041. begin
  1042. if dst<>src1 then
  1043. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  1044. else
  1045. begin
  1046. tmpreg:=getintregister(list,size);
  1047. a_load_reg_reg(list,size,size,src2,dst);
  1048. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  1049. end;
  1050. end
  1051. else
  1052. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  1053. end;
  1054. end;
  1055. else
  1056. begin
  1057. if cgsetflags or setflags then
  1058. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1059. list.concat(setoppostfix(
  1060. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  1061. end;
  1062. end;
  1063. maybeadjustresult(list,op,size,dst);
  1064. end;
  1065. procedure tcgarm.a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister);
  1066. var
  1067. asmop: tasmop;
  1068. begin
  1069. if CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype] then
  1070. begin
  1071. list.concat(tai_comment.create(strpnew('tcgarm.a_mul_reg_reg_pair called')));
  1072. case size of
  1073. OS_32: asmop:=A_UMULL;
  1074. OS_S32: asmop:=A_SMULL;
  1075. else
  1076. InternalError(2014060802);
  1077. end;
  1078. { The caller might omit dstlo or dsthi, when he is not interested in it, we still
  1079. need valid registers everywhere. In case of dsthi = NR_NO we could fall back to
  1080. 32x32=32 bit multiplication}
  1081. if (dstlo = NR_NO) then
  1082. dstlo:=getintregister(list,size);
  1083. if (dsthi = NR_NO) then
  1084. dsthi:=getintregister(list,size);
  1085. list.concat(taicpu.op_reg_reg_reg_reg(asmop, dstlo, dsthi, src1,src2));
  1086. end
  1087. else if dsthi=NR_NO then
  1088. begin
  1089. if (dstlo = NR_NO) then
  1090. dstlo:=getintregister(list,size);
  1091. list.concat(taicpu.op_reg_reg_reg(A_MUL, dstlo, src1,src2));
  1092. end
  1093. else
  1094. begin
  1095. internalerror(2015083022);
  1096. end;
  1097. end;
  1098. function tbasecgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  1099. var
  1100. tmpreg1,tmpreg2 : tregister;
  1101. begin
  1102. tmpreg1:=NR_NO;
  1103. { Be sure to have a base register }
  1104. if (ref.base=NR_NO) then
  1105. begin
  1106. if ref.shiftmode<>SM_None then
  1107. internalerror(2014020701);
  1108. ref.base:=ref.index;
  1109. ref.index:=NR_NO;
  1110. end;
  1111. { absolute symbols can't be handled directly, we've to store the symbol reference
  1112. in the text segment and access it pc relative
  1113. For now, we assume that references where base or index equals to PC are already
  1114. relative, all other references are assumed to be absolute and thus they need
  1115. to be handled extra.
  1116. A proper solution would be to change refoptions to a set and store the information
  1117. if the symbol is absolute or relative there.
  1118. }
  1119. if (assigned(ref.symbol) and
  1120. not(is_pc(ref.base)) and
  1121. not(is_pc(ref.index))
  1122. ) or
  1123. { [#xxx] isn't a valid address operand }
  1124. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  1125. (ref.offset<-4095) or
  1126. (ref.offset>4095) or
  1127. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  1128. ((ref.offset<-255) or
  1129. (ref.offset>255)
  1130. )
  1131. ) or
  1132. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1133. ((ref.offset<-1020) or
  1134. (ref.offset>1020) or
  1135. ((abs(ref.offset) mod 4)<>0)
  1136. )
  1137. ) or
  1138. ((GenerateThumbCode) and
  1139. (((oppostfix in [PF_SB,PF_SH]) and (ref.offset<>0)) or
  1140. ((oppostfix=PF_None) and ((ref.offset<0) or ((ref.base<>NR_STACK_POINTER_REG) and (ref.offset>124)) or
  1141. ((ref.base=NR_STACK_POINTER_REG) and (ref.offset>1020)) or ((ref.offset mod 4)<>0))) or
  1142. ((oppostfix=PF_H) and ((ref.offset<0) or (ref.offset>62) or ((ref.offset mod 2)<>0) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0)))) or
  1143. ((oppostfix=PF_B) and ((ref.offset<0) or (ref.offset>31) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0))))
  1144. )
  1145. ) then
  1146. begin
  1147. fixref(list,ref);
  1148. end;
  1149. if GenerateThumbCode then
  1150. begin
  1151. { certain thumb load require base and index }
  1152. if (oppostfix in [PF_SB,PF_SH]) and
  1153. (ref.base<>NR_NO) and (ref.index=NR_NO) then
  1154. begin
  1155. tmpreg1:=getintregister(list,OS_ADDR);
  1156. a_load_const_reg(list,OS_ADDR,0,tmpreg1);
  1157. ref.index:=tmpreg1;
  1158. end;
  1159. { "hi" registers cannot be used as base or index }
  1160. if (getsupreg(ref.base) in [RS_R8..RS_R12,RS_R14]) or
  1161. ((ref.base=NR_R13) and (ref.index<>NR_NO)) then
  1162. begin
  1163. tmpreg1:=getintregister(list,OS_ADDR);
  1164. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.base,tmpreg1);
  1165. ref.base:=tmpreg1;
  1166. end;
  1167. if getsupreg(ref.index) in [RS_R8..RS_R14] then
  1168. begin
  1169. tmpreg1:=getintregister(list,OS_ADDR);
  1170. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.index,tmpreg1);
  1171. ref.index:=tmpreg1;
  1172. end;
  1173. end;
  1174. { fold if there is base, index and offset, however, don't fold
  1175. for vfp memory instructions because we later fold the index }
  1176. if not((op in [A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1177. (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  1178. begin
  1179. if tmpreg1<>NR_NO then
  1180. begin
  1181. tmpreg2:=getintregister(list,OS_ADDR);
  1182. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg1,tmpreg2);
  1183. tmpreg1:=tmpreg2;
  1184. end
  1185. else
  1186. begin
  1187. tmpreg1:=getintregister(list,OS_ADDR);
  1188. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg1);
  1189. ref.base:=tmpreg1;
  1190. end;
  1191. ref.offset:=0;
  1192. end;
  1193. { floating point operations have only limited references
  1194. we expect here, that a base is already set }
  1195. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  1196. begin
  1197. if ref.shiftmode<>SM_none then
  1198. internalerror(200309121);
  1199. if tmpreg1<>NR_NO then
  1200. begin
  1201. if ref.base=tmpreg1 then
  1202. begin
  1203. if ref.signindex<0 then
  1204. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,tmpreg1,ref.index))
  1205. else
  1206. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,tmpreg1,ref.index));
  1207. ref.index:=NR_NO;
  1208. end
  1209. else
  1210. begin
  1211. if ref.index<>tmpreg1 then
  1212. internalerror(200403161);
  1213. if ref.signindex<0 then
  1214. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,ref.base,tmpreg1))
  1215. else
  1216. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,tmpreg1));
  1217. ref.base:=tmpreg1;
  1218. ref.index:=NR_NO;
  1219. end;
  1220. end
  1221. else
  1222. begin
  1223. tmpreg1:=getintregister(list,OS_ADDR);
  1224. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,ref.index));
  1225. ref.base:=tmpreg1;
  1226. ref.index:=NR_NO;
  1227. end;
  1228. end;
  1229. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  1230. Result := ref;
  1231. end;
  1232. procedure tbasecgarm.a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);
  1233. var
  1234. oppostfix:toppostfix;
  1235. usedtmpref: treference;
  1236. tmpreg : tregister;
  1237. dir : integer;
  1238. begin
  1239. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  1240. FromSize := ToSize;
  1241. case ToSize of
  1242. { signed integer registers }
  1243. OS_8,
  1244. OS_S8:
  1245. oppostfix:=PF_B;
  1246. OS_16,
  1247. OS_S16:
  1248. oppostfix:=PF_H;
  1249. OS_32,
  1250. OS_S32,
  1251. { for vfp value stored in integer register }
  1252. OS_F32:
  1253. oppostfix:=PF_None;
  1254. else
  1255. InternalError(200308299);
  1256. end;
  1257. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[tosize])) or
  1258. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  1259. (oppostfix =PF_H)) then
  1260. begin
  1261. if target_info.endian=endian_big then
  1262. dir:=-1
  1263. else
  1264. dir:=1;
  1265. case FromSize of
  1266. OS_16,OS_S16:
  1267. begin
  1268. tmpreg:=getintregister(list,OS_INT);
  1269. usedtmpref:=ref;
  1270. if target_info.endian=endian_big then
  1271. inc(usedtmpref.offset,1);
  1272. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1273. inc(usedtmpref.offset,dir);
  1274. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1275. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1276. end;
  1277. OS_32,OS_S32:
  1278. begin
  1279. tmpreg:=getintregister(list,OS_INT);
  1280. usedtmpref:=ref;
  1281. if ref.alignment=2 then
  1282. begin
  1283. if target_info.endian=endian_big then
  1284. inc(usedtmpref.offset,2);
  1285. usedtmpref:=a_internal_load_reg_ref(list,OS_16,OS_16,reg,usedtmpref);
  1286. a_op_const_reg_reg(list,OP_SHR,OS_INT,16,reg,tmpreg);
  1287. inc(usedtmpref.offset,dir*2);
  1288. a_internal_load_reg_ref(list,OS_16,OS_16,tmpreg,usedtmpref);
  1289. end
  1290. else
  1291. begin
  1292. if target_info.endian=endian_big then
  1293. inc(usedtmpref.offset,3);
  1294. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1295. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1296. inc(usedtmpref.offset,dir);
  1297. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1298. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1299. inc(usedtmpref.offset,dir);
  1300. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1301. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1302. inc(usedtmpref.offset,dir);
  1303. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1304. end;
  1305. end
  1306. else
  1307. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1308. end;
  1309. end
  1310. else
  1311. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1312. end;
  1313. function tbasecgarm.a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  1314. var
  1315. oppostfix:toppostfix;
  1316. href: treference;
  1317. tmpreg: TRegister;
  1318. begin
  1319. case ToSize of
  1320. { signed integer registers }
  1321. OS_8,
  1322. OS_S8:
  1323. oppostfix:=PF_B;
  1324. OS_16,
  1325. OS_S16:
  1326. oppostfix:=PF_H;
  1327. OS_32,
  1328. OS_S32:
  1329. oppostfix:=PF_None;
  1330. else
  1331. InternalError(2003082910);
  1332. end;
  1333. if (tosize in [OS_S16,OS_16]) and
  1334. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1335. begin
  1336. result:=handle_load_store(list,A_STR,PF_B,reg,ref);
  1337. tmpreg:=getintregister(list,OS_INT);
  1338. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1339. href:=result;
  1340. inc(href.offset);
  1341. handle_load_store(list,A_STR,PF_B,tmpreg,href);
  1342. end
  1343. else
  1344. result:=handle_load_store(list,A_STR,oppostfix,reg,ref);
  1345. end;
  1346. function tbasecgarm.a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  1347. var
  1348. oppostfix:toppostfix;
  1349. so: tshifterop;
  1350. tmpreg: TRegister;
  1351. href: treference;
  1352. begin
  1353. case FromSize of
  1354. { signed integer registers }
  1355. OS_8:
  1356. oppostfix:=PF_B;
  1357. OS_S8:
  1358. oppostfix:=PF_SB;
  1359. OS_16:
  1360. oppostfix:=PF_H;
  1361. OS_S16:
  1362. oppostfix:=PF_SH;
  1363. OS_32,
  1364. OS_S32:
  1365. oppostfix:=PF_None;
  1366. else
  1367. InternalError(200308291);
  1368. end;
  1369. if (tosize=OS_S8) and
  1370. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1371. begin
  1372. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1373. a_load_reg_reg(list,OS_S8,OS_32,reg,reg);
  1374. end
  1375. else if (tosize in [OS_S16,OS_16]) and
  1376. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1377. begin
  1378. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1379. tmpreg:=getintregister(list,OS_INT);
  1380. href:=result;
  1381. inc(href.offset);
  1382. handle_load_store(list,A_LDR,PF_B,tmpreg,href);
  1383. shifterop_reset(so);
  1384. so.shiftmode:=SM_LSL;
  1385. so.shiftimm:=8;
  1386. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  1387. end
  1388. else
  1389. result:=handle_load_store(list,A_LDR,oppostfix,reg,ref);
  1390. end;
  1391. procedure tbasecgarm.a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);
  1392. var
  1393. so : tshifterop;
  1394. procedure do_shift(shiftmode : tshiftmode; shiftimm : byte; reg : tregister);
  1395. begin
  1396. if GenerateThumbCode then
  1397. begin
  1398. case shiftmode of
  1399. SM_ASR:
  1400. a_op_const_reg_reg(list,OP_SAR,OS_32,shiftimm,reg,reg2);
  1401. SM_LSR:
  1402. a_op_const_reg_reg(list,OP_SHR,OS_32,shiftimm,reg,reg2);
  1403. SM_LSL:
  1404. a_op_const_reg_reg(list,OP_SHL,OS_32,shiftimm,reg,reg2);
  1405. else
  1406. internalerror(2013090301);
  1407. end;
  1408. end
  1409. else
  1410. begin
  1411. so.shiftmode:=shiftmode;
  1412. so.shiftimm:=shiftimm;
  1413. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,reg2,reg,so));
  1414. end;
  1415. end;
  1416. var
  1417. instr: taicpu;
  1418. conv_done: boolean;
  1419. begin
  1420. if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then
  1421. internalerror(2002090901);
  1422. conv_done:=false;
  1423. if tosize<>fromsize then
  1424. begin
  1425. shifterop_reset(so);
  1426. conv_done:=true;
  1427. if tcgsize2size[tosize]<=tcgsize2size[fromsize] then
  1428. fromsize:=tosize;
  1429. if current_settings.cputype<cpu_armv6 then
  1430. case fromsize of
  1431. OS_8:
  1432. if GenerateThumbCode then
  1433. a_op_const_reg_reg(list,OP_AND,OS_32,$ff,reg1,reg2)
  1434. else
  1435. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1436. OS_S8:
  1437. begin
  1438. do_shift(SM_LSL,24,reg1);
  1439. if tosize=OS_16 then
  1440. begin
  1441. do_shift(SM_ASR,8,reg2);
  1442. do_shift(SM_LSR,16,reg2);
  1443. end
  1444. else
  1445. do_shift(SM_ASR,24,reg2);
  1446. end;
  1447. OS_16:
  1448. begin
  1449. do_shift(SM_LSL,16,reg1);
  1450. do_shift(SM_LSR,16,reg2);
  1451. end;
  1452. OS_S16:
  1453. begin
  1454. do_shift(SM_LSL,16,reg1);
  1455. do_shift(SM_ASR,16,reg2)
  1456. end;
  1457. else
  1458. conv_done:=false;
  1459. end
  1460. else
  1461. case fromsize of
  1462. OS_8:
  1463. if GenerateThumbCode then
  1464. list.concat(taicpu.op_reg_reg(A_UXTB,reg2,reg1))
  1465. else
  1466. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1467. OS_S8:
  1468. begin
  1469. if tosize=OS_16 then
  1470. begin
  1471. so.shiftmode:=SM_ROR;
  1472. so.shiftimm:=16;
  1473. list.concat(taicpu.op_reg_reg_shifterop(A_SXTB16,reg2,reg1,so));
  1474. do_shift(SM_LSR,16,reg2);
  1475. end
  1476. else
  1477. list.concat(taicpu.op_reg_reg(A_SXTB,reg2,reg1));
  1478. end;
  1479. OS_16:
  1480. list.concat(taicpu.op_reg_reg(A_UXTH,reg2,reg1));
  1481. OS_S16:
  1482. list.concat(taicpu.op_reg_reg(A_SXTH,reg2,reg1));
  1483. else
  1484. conv_done:=false;
  1485. end
  1486. end;
  1487. if not conv_done and (reg1<>reg2) then
  1488. begin
  1489. { same size, only a register mov required }
  1490. instr:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
  1491. list.Concat(instr);
  1492. { Notify the register allocator that we have written a move instruction so
  1493. it can try to eliminate it. }
  1494. add_move_instruction(instr);
  1495. end;
  1496. end;
  1497. procedure tbasecgarm.a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);
  1498. var
  1499. href,href2 : treference;
  1500. hloc : pcgparalocation;
  1501. begin
  1502. href:=ref;
  1503. hloc:=paraloc.location;
  1504. while assigned(hloc) do
  1505. begin
  1506. case hloc^.loc of
  1507. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  1508. begin
  1509. paramanager.allocparaloc(list,paraloc.location);
  1510. a_loadfpu_ref_reg(list,size,size,ref,hloc^.register);
  1511. end;
  1512. LOC_REGISTER :
  1513. case hloc^.size of
  1514. OS_32,
  1515. OS_F32:
  1516. begin
  1517. paramanager.allocparaloc(list,paraloc.location);
  1518. a_load_ref_reg(list,OS_32,OS_32,href,hloc^.register);
  1519. end;
  1520. OS_64,
  1521. OS_F64:
  1522. cg64.a_load64_ref_cgpara(list,href,paraloc);
  1523. else
  1524. a_load_ref_reg(list,hloc^.size,hloc^.size,href,hloc^.register);
  1525. end;
  1526. LOC_REFERENCE :
  1527. begin
  1528. reference_reset_base(href2,hloc^.reference.index,hloc^.reference.offset,paraloc.alignment,[]);
  1529. { concatcopy should choose the best way to copy the data }
  1530. g_concatcopy(list,href,href2,tcgsize2size[hloc^.size]);
  1531. end;
  1532. else
  1533. internalerror(200408241);
  1534. end;
  1535. inc(href.offset,tcgsize2size[hloc^.size]);
  1536. hloc:=hloc^.next;
  1537. end;
  1538. end;
  1539. procedure tbasecgarm.a_loadfpu_reg_reg(list: TAsmList; fromsize,tosize: tcgsize; reg1, reg2: tregister);
  1540. begin
  1541. list.concat(setoppostfix(taicpu.op_reg_reg(A_MVF,reg2,reg1),cgsize2fpuoppostfix[tosize]));
  1542. end;
  1543. procedure tbasecgarm.a_loadfpu_ref_reg(list: TAsmList; fromsize,tosize: tcgsize; const ref: treference; reg: tregister);
  1544. var
  1545. oppostfix:toppostfix;
  1546. begin
  1547. case fromsize of
  1548. OS_32,
  1549. OS_F32:
  1550. oppostfix:=PF_S;
  1551. OS_64,
  1552. OS_F64:
  1553. oppostfix:=PF_D;
  1554. OS_F80:
  1555. oppostfix:=PF_E;
  1556. else
  1557. InternalError(200309021);
  1558. end;
  1559. handle_load_store(list,A_LDF,oppostfix,reg,ref);
  1560. if fromsize<>tosize then
  1561. a_loadfpu_reg_reg(list,fromsize,tosize,reg,reg);
  1562. end;
  1563. procedure tbasecgarm.a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);
  1564. var
  1565. oppostfix:toppostfix;
  1566. begin
  1567. case tosize of
  1568. OS_F32:
  1569. oppostfix:=PF_S;
  1570. OS_F64:
  1571. oppostfix:=PF_D;
  1572. OS_F80:
  1573. oppostfix:=PF_E;
  1574. else
  1575. InternalError(200309022);
  1576. end;
  1577. handle_load_store(list,A_STF,oppostfix,reg,ref);
  1578. end;
  1579. { comparison operations }
  1580. procedure tbasecgarm.a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  1581. l : tasmlabel);
  1582. var
  1583. tmpreg : tregister;
  1584. b : byte;
  1585. begin
  1586. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1587. if (not(GenerateThumbCode) and is_shifter_const(a,b)) or
  1588. ((GenerateThumbCode) and is_thumb_imm(a)) then
  1589. list.concat(taicpu.op_reg_const(A_CMP,reg,a))
  1590. { CMN reg,0 and CMN reg,$80000000 are different from CMP reg,$ffffffff
  1591. and CMP reg,$7fffffff regarding the flags according to the ARM manual }
  1592. else if (a<>$7fffffff) and (a<>-1) and not(GenerateThumbCode) and is_shifter_const(-a,b) then
  1593. list.concat(taicpu.op_reg_const(A_CMN,reg,-a))
  1594. else
  1595. begin
  1596. tmpreg:=getintregister(list,size);
  1597. a_load_const_reg(list,size,a,tmpreg);
  1598. list.concat(taicpu.op_reg_reg(A_CMP,reg,tmpreg));
  1599. end;
  1600. a_jmp_cond(list,cmp_op,l);
  1601. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1602. end;
  1603. procedure tbasecgarm.a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister);
  1604. begin
  1605. if reverse then
  1606. begin
  1607. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,src));
  1608. list.Concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,31));
  1609. list.Concat(taicpu.op_reg_reg_const(A_AND,dst,dst,255));
  1610. end
  1611. { it is decided during the compilation of the system unit if this code is used or not
  1612. so no additional check for rbit is needed }
  1613. else
  1614. begin
  1615. list.Concat(taicpu.op_reg_reg(A_RBIT,dst,src));
  1616. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,dst));
  1617. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1618. list.Concat(taicpu.op_reg_const(A_CMP,dst,32));
  1619. if GenerateThumb2Code then
  1620. list.Concat(taicpu.op_cond(A_IT, C_EQ));
  1621. list.Concat(setcondition(taicpu.op_reg_const(A_MOV,dst,$ff),C_EQ));
  1622. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1623. end;
  1624. end;
  1625. procedure tbasecgarm.a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel);
  1626. begin
  1627. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1628. list.concat(taicpu.op_reg_reg(A_CMP,reg2,reg1));
  1629. a_jmp_cond(list,cmp_op,l);
  1630. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1631. end;
  1632. procedure tbasecgarm.a_jmp_name(list : TAsmList;const s : string);
  1633. var
  1634. ai : taicpu;
  1635. begin
  1636. { generate far jump, leave it to the optimizer to get rid of it }
  1637. if GenerateThumbCode then
  1638. ai:=taicpu.op_sym(A_BL,current_asmdata.RefAsmSymbol(s,AT_FUNCTION))
  1639. else
  1640. ai:=taicpu.op_sym(A_B,current_asmdata.RefAsmSymbol(s,AT_FUNCTION));
  1641. ai.is_jmp:=true;
  1642. list.concat(ai);
  1643. end;
  1644. procedure tbasecgarm.a_jmp_always(list : TAsmList;l: tasmlabel);
  1645. var
  1646. ai : taicpu;
  1647. begin
  1648. { generate far jump, leave it to the optimizer to get rid of it }
  1649. if GenerateThumbCode then
  1650. ai:=taicpu.op_sym(A_BL,l)
  1651. else
  1652. ai:=taicpu.op_sym(A_B,l);
  1653. ai.is_jmp:=true;
  1654. list.concat(ai);
  1655. end;
  1656. procedure tbasecgarm.a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel);
  1657. var
  1658. ai : taicpu;
  1659. inv_flags : TResFlags;
  1660. hlabel : TAsmLabel;
  1661. begin
  1662. if GenerateThumbCode then
  1663. begin
  1664. inv_flags:=f;
  1665. inverse_flags(inv_flags);
  1666. { the optimizer has to fix this if jump range is sufficient short }
  1667. current_asmdata.getjumplabel(hlabel);
  1668. ai:=setcondition(taicpu.op_sym(A_B,hlabel),flags_to_cond(inv_flags));
  1669. ai.is_jmp:=true;
  1670. list.concat(ai);
  1671. a_jmp_always(list,l);
  1672. a_label(list,hlabel);
  1673. end
  1674. else
  1675. begin
  1676. ai:=setcondition(taicpu.op_sym(A_B,l),flags_to_cond(f));
  1677. ai.is_jmp:=true;
  1678. list.concat(ai);
  1679. end;
  1680. end;
  1681. procedure tbasecgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  1682. begin
  1683. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  1684. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  1685. end;
  1686. procedure tbasecgarm.g_profilecode(list : TAsmList);
  1687. begin
  1688. if target_info.system = system_arm_linux then
  1689. begin
  1690. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R14]));
  1691. a_call_name(list,'__gnu_mcount_nc',false);
  1692. end
  1693. else
  1694. internalerror(2014091201);
  1695. end;
  1696. procedure tbasecgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  1697. var
  1698. ref : treference;
  1699. shift : byte;
  1700. firstfloatreg,lastfloatreg,
  1701. r : byte;
  1702. mmregs,
  1703. regs, saveregs : tcpuregisterset;
  1704. registerarea,
  1705. r7offset,
  1706. stackmisalignment : pint;
  1707. imm1, imm2: DWord;
  1708. stack_parameters : Boolean;
  1709. begin
  1710. LocalSize:=align(LocalSize,4);
  1711. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  1712. { call instruction does not put anything on the stack }
  1713. registerarea:=0;
  1714. tarmprocinfo(current_procinfo).stackpaddingreg:=High(TSuperRegister);
  1715. lastfloatreg:=RS_NO;
  1716. if not(nostackframe) then
  1717. begin
  1718. firstfloatreg:=RS_NO;
  1719. mmregs:=[];
  1720. case current_settings.fputype of
  1721. fpu_fpa,
  1722. fpu_fpa10,
  1723. fpu_fpa11:
  1724. begin
  1725. { save floating point registers? }
  1726. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1727. for r:=RS_F0 to RS_F7 do
  1728. if r in regs then
  1729. begin
  1730. if firstfloatreg=RS_NO then
  1731. firstfloatreg:=r;
  1732. lastfloatreg:=r;
  1733. inc(registerarea,12);
  1734. end;
  1735. end;
  1736. fpu_vfpv2,
  1737. fpu_vfpv3,
  1738. fpu_vfpv4,
  1739. fpu_vfpv3_d16:
  1740. begin;
  1741. { the *[0..31] is a hack to prevent that the compiler tries to save odd single-type registers,
  1742. they have numbers>$1f which is not really correct as they should simply have the same numbers
  1743. as the even ones by with a different subtype as it is done on x86 with al/ah }
  1744. mmregs:=(rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall))*[0..31];
  1745. end;
  1746. end;
  1747. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1748. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1749. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  1750. { save int registers }
  1751. reference_reset(ref,4,[]);
  1752. ref.index:=NR_STACK_POINTER_REG;
  1753. ref.addressmode:=AM_PREINDEXED;
  1754. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  1755. if not(target_info.system in systems_darwin) then
  1756. begin
  1757. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1758. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1759. begin
  1760. a_reg_alloc(list,NR_R12);
  1761. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  1762. end;
  1763. { the (old) ARM APCS requires saving both the stack pointer (to
  1764. crawl the stack) and the PC (to identify the function this
  1765. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  1766. and R15 -- still needs updating for EABI and Darwin, they don't
  1767. need that }
  1768. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1769. regs:=regs+[RS_FRAME_POINTER_REG,RS_R12,RS_R14,RS_R15]
  1770. else
  1771. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1772. include(regs,RS_R14);
  1773. if regs<>[] then
  1774. begin
  1775. for r:=RS_R0 to RS_R15 do
  1776. if r in regs then
  1777. inc(registerarea,4);
  1778. { if the stack is not 8 byte aligned, try to add an extra register,
  1779. so we can avoid the extra sub/add ...,#4 later (KB) }
  1780. if ((registerarea mod current_settings.alignment.localalignmax) <> 0) then
  1781. for r:=RS_R3 downto RS_R0 do
  1782. if not(r in regs) then
  1783. begin
  1784. regs:=regs+[r];
  1785. inc(registerarea,4);
  1786. tarmprocinfo(current_procinfo).stackpaddingreg:=r;
  1787. break;
  1788. end;
  1789. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  1790. end;
  1791. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1792. begin
  1793. { the framepointer now points to the saved R15, so the saved
  1794. framepointer is at R11-12 (for get_caller_frame) }
  1795. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  1796. a_reg_dealloc(list,NR_R12);
  1797. end;
  1798. end
  1799. else
  1800. begin
  1801. { always save r14 if we use r7 as the framepointer, because
  1802. the parameter offsets are hardcoded in advance and always
  1803. assume that r14 sits on the stack right behind the saved r7
  1804. }
  1805. if current_procinfo.framepointer=NR_FRAME_POINTER_REG then
  1806. include(regs,RS_FRAME_POINTER_REG);
  1807. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1808. include(regs,RS_R14);
  1809. if regs<>[] then
  1810. begin
  1811. { on Darwin, you first have to save [r4-r7,lr], and then
  1812. [r8,r10,r11] and make r7 point to the previously saved
  1813. r7 so that you can perform a stack crawl based on it
  1814. ([r7] is previous stack frame, [r7+4] is return address
  1815. }
  1816. include(regs,RS_FRAME_POINTER_REG);
  1817. saveregs:=regs-[RS_R8,RS_R10,RS_R11];
  1818. r7offset:=0;
  1819. for r:=RS_R0 to RS_R15 do
  1820. if r in saveregs then
  1821. begin
  1822. inc(registerarea,4);
  1823. if r<RS_FRAME_POINTER_REG then
  1824. inc(r7offset,4);
  1825. end;
  1826. { save the registers }
  1827. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1828. { make r7 point to the saved r7 (regardless of whether this
  1829. frame uses the framepointer, for backtrace purposes) }
  1830. if r7offset<>0 then
  1831. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_FRAME_POINTER_REG,NR_R13,r7offset))
  1832. else
  1833. list.concat(taicpu.op_reg_reg(A_MOV,NR_R7,NR_R13));
  1834. { now save the rest (if any) }
  1835. saveregs:=regs-saveregs;
  1836. if saveregs<>[] then
  1837. begin
  1838. for r:=RS_R8 to RS_R11 do
  1839. if r in saveregs then
  1840. inc(registerarea,4);
  1841. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1842. end;
  1843. end;
  1844. end;
  1845. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  1846. if (LocalSize<>0) or
  1847. ((stackmisalignment<>0) and
  1848. ((pi_do_call in current_procinfo.flags) or
  1849. (po_assembler in current_procinfo.procdef.procoptions))) then
  1850. begin
  1851. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  1852. if stack_parameters and (pi_estimatestacksize in current_procinfo.flags) then
  1853. begin
  1854. if localsize>tarmprocinfo(current_procinfo).stackframesize then
  1855. internalerror(2014030901)
  1856. else
  1857. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea;
  1858. end;
  1859. if is_shifter_const(localsize,shift) then
  1860. begin
  1861. a_reg_dealloc(list,NR_R12);
  1862. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  1863. end
  1864. else if split_into_shifter_const(localsize, imm1, imm2) then
  1865. begin
  1866. a_reg_dealloc(list,NR_R12);
  1867. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  1868. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  1869. end
  1870. else
  1871. begin
  1872. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  1873. a_reg_alloc(list,NR_R12);
  1874. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  1875. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  1876. a_reg_dealloc(list,NR_R12);
  1877. end;
  1878. end;
  1879. if (mmregs<>[]) or
  1880. (firstfloatreg<>RS_NO) then
  1881. begin
  1882. reference_reset(ref,4,[]);
  1883. if (tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023) or
  1884. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv4,fpu_vfpv3_d16]) then
  1885. begin
  1886. if not is_shifter_const(tarmprocinfo(current_procinfo).floatregstart,shift) then
  1887. begin
  1888. a_reg_alloc(list,NR_R12);
  1889. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  1890. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1891. a_reg_dealloc(list,NR_R12);
  1892. end
  1893. else
  1894. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tarmprocinfo(current_procinfo).floatregstart));
  1895. ref.base:=NR_R12;
  1896. end
  1897. else
  1898. begin
  1899. ref.base:=current_procinfo.framepointer;
  1900. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  1901. end;
  1902. case current_settings.fputype of
  1903. fpu_fpa,
  1904. fpu_fpa10,
  1905. fpu_fpa11:
  1906. begin
  1907. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  1908. lastfloatreg-firstfloatreg+1,ref));
  1909. end;
  1910. fpu_vfpv2,
  1911. fpu_vfpv3,
  1912. fpu_vfpv4,
  1913. fpu_vfpv3_d16:
  1914. begin
  1915. ref.index:=ref.base;
  1916. ref.base:=NR_NO;
  1917. { FSTMX is deprecated on ARMv6 and later }
  1918. {if (current_settings.cputype<cpu_armv6) then
  1919. postfix:=PF_IAX
  1920. else
  1921. postfix:=PF_IAD;}
  1922. if mmregs<>[] then
  1923. list.concat(taicpu.op_ref_regset(A_VSTM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  1924. end;
  1925. end;
  1926. end;
  1927. end;
  1928. end;
  1929. procedure tbasecgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  1930. var
  1931. ref : treference;
  1932. LocalSize : longint;
  1933. firstfloatreg,lastfloatreg,
  1934. r,
  1935. shift : byte;
  1936. mmregs,
  1937. saveregs,
  1938. regs : tcpuregisterset;
  1939. registerarea,
  1940. stackmisalignment: pint;
  1941. paddingreg: TSuperRegister;
  1942. imm1, imm2: DWord;
  1943. begin
  1944. if not(nostackframe) then
  1945. begin
  1946. registerarea:=0;
  1947. firstfloatreg:=RS_NO;
  1948. lastfloatreg:=RS_NO;
  1949. mmregs:=[];
  1950. saveregs:=[];
  1951. case current_settings.fputype of
  1952. fpu_fpa,
  1953. fpu_fpa10,
  1954. fpu_fpa11:
  1955. begin
  1956. { restore floating point registers? }
  1957. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1958. for r:=RS_F0 to RS_F7 do
  1959. if r in regs then
  1960. begin
  1961. if firstfloatreg=RS_NO then
  1962. firstfloatreg:=r;
  1963. lastfloatreg:=r;
  1964. { floating point register space is already included in
  1965. localsize below by calc_stackframe_size
  1966. inc(registerarea,12);
  1967. }
  1968. end;
  1969. end;
  1970. fpu_vfpv2,
  1971. fpu_vfpv3,
  1972. fpu_vfpv4,
  1973. fpu_vfpv3_d16:
  1974. begin;
  1975. { restore vfp registers? }
  1976. { the *[0..31] is a hack to prevent that the compiler tries to save odd single-type registers,
  1977. they have numbers>$1f which is not really correct as they should simply have the same numbers
  1978. as the even ones by with a different subtype as it is done on x86 with al/ah }
  1979. mmregs:=(rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall))*[0..31];
  1980. end;
  1981. end;
  1982. if (firstfloatreg<>RS_NO) or
  1983. (mmregs<>[]) then
  1984. begin
  1985. reference_reset(ref,4,[]);
  1986. if (tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023) or
  1987. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv4,fpu_vfpv3_d16]) then
  1988. begin
  1989. if not is_shifter_const(tarmprocinfo(current_procinfo).floatregstart,shift) then
  1990. begin
  1991. a_reg_alloc(list,NR_R12);
  1992. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  1993. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1994. a_reg_dealloc(list,NR_R12);
  1995. end
  1996. else
  1997. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tarmprocinfo(current_procinfo).floatregstart));
  1998. ref.base:=NR_R12;
  1999. end
  2000. else
  2001. begin
  2002. ref.base:=current_procinfo.framepointer;
  2003. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  2004. end;
  2005. case current_settings.fputype of
  2006. fpu_fpa,
  2007. fpu_fpa10,
  2008. fpu_fpa11:
  2009. begin
  2010. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  2011. lastfloatreg-firstfloatreg+1,ref));
  2012. end;
  2013. fpu_vfpv2,
  2014. fpu_vfpv3,
  2015. fpu_vfpv4,
  2016. fpu_vfpv3_d16:
  2017. begin
  2018. ref.index:=ref.base;
  2019. ref.base:=NR_NO;
  2020. { FLDMX is deprecated on ARMv6 and later }
  2021. {if (current_settings.cputype<cpu_armv6) then
  2022. mmpostfix:=PF_IAX
  2023. else
  2024. mmpostfix:=PF_IAD;}
  2025. if mmregs<>[] then
  2026. list.concat(taicpu.op_ref_regset(A_VLDM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  2027. end;
  2028. end;
  2029. end;
  2030. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  2031. if (pi_do_call in current_procinfo.flags) or
  2032. (regs<>[]) or
  2033. ((target_info.system in systems_darwin) and
  2034. (current_procinfo.framepointer<>NR_STACK_POINTER_REG)) then
  2035. begin
  2036. exclude(regs,RS_R14);
  2037. include(regs,RS_R15);
  2038. if (target_info.system in systems_darwin) then
  2039. include(regs,RS_FRAME_POINTER_REG);
  2040. end;
  2041. if not(target_info.system in systems_darwin) then
  2042. begin
  2043. { restore saved stack pointer to SP (R13) and saved lr to PC (R15).
  2044. The saved PC came after that but is discarded, since we restore
  2045. the stack pointer }
  2046. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  2047. regs:=regs+[RS_FRAME_POINTER_REG,RS_R13,RS_R15];
  2048. end
  2049. else
  2050. begin
  2051. { restore R8-R11 already if necessary (they've been stored
  2052. before the others) }
  2053. saveregs:=regs*[RS_R8,RS_R10,RS_R11];
  2054. if saveregs<>[] then
  2055. begin
  2056. reference_reset(ref,4,[]);
  2057. ref.index:=NR_STACK_POINTER_REG;
  2058. ref.addressmode:=AM_PREINDEXED;
  2059. for r:=RS_R8 to RS_R11 do
  2060. if r in saveregs then
  2061. inc(registerarea,4);
  2062. regs:=regs-saveregs;
  2063. end;
  2064. end;
  2065. for r:=RS_R0 to RS_R15 do
  2066. if r in regs then
  2067. inc(registerarea,4);
  2068. { reapply the stack padding reg, in case there was one, see the complimentary
  2069. comment in g_proc_entry() (KB) }
  2070. paddingreg:=tarmprocinfo(current_procinfo).stackpaddingreg;
  2071. if paddingreg < RS_R4 then
  2072. if paddingreg in regs then
  2073. internalerror(201306190)
  2074. else
  2075. begin
  2076. regs:=regs+[paddingreg];
  2077. inc(registerarea,4);
  2078. end;
  2079. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  2080. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  2081. (target_info.system in systems_darwin) then
  2082. begin
  2083. LocalSize:=current_procinfo.calc_stackframe_size;
  2084. if (LocalSize<>0) or
  2085. ((stackmisalignment<>0) and
  2086. ((pi_do_call in current_procinfo.flags) or
  2087. (po_assembler in current_procinfo.procdef.procoptions))) then
  2088. begin
  2089. if pi_estimatestacksize in current_procinfo.flags then
  2090. LocalSize:=tarmprocinfo(current_procinfo).stackframesize-registerarea
  2091. else
  2092. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  2093. if is_shifter_const(LocalSize,shift) then
  2094. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  2095. else if split_into_shifter_const(localsize, imm1, imm2) then
  2096. begin
  2097. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  2098. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  2099. end
  2100. else
  2101. begin
  2102. a_reg_alloc(list,NR_R12);
  2103. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  2104. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  2105. a_reg_dealloc(list,NR_R12);
  2106. end;
  2107. end;
  2108. if (target_info.system in systems_darwin) and
  2109. (saveregs<>[]) then
  2110. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  2111. if regs=[] then
  2112. begin
  2113. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2114. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2115. else
  2116. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2117. end
  2118. else
  2119. begin
  2120. reference_reset(ref,4,[]);
  2121. ref.index:=NR_STACK_POINTER_REG;
  2122. ref.addressmode:=AM_PREINDEXED;
  2123. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  2124. end;
  2125. end
  2126. else
  2127. begin
  2128. { restore int registers and return }
  2129. reference_reset(ref,4,[]);
  2130. ref.index:=NR_FRAME_POINTER_REG;
  2131. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_EA));
  2132. end;
  2133. end
  2134. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2135. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2136. else
  2137. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2138. end;
  2139. procedure tbasecgarm.g_maybe_got_init(list : TAsmList);
  2140. var
  2141. ref : treference;
  2142. l : TAsmLabel;
  2143. regs : tcpuregisterset;
  2144. r: byte;
  2145. begin
  2146. if (cs_create_pic in current_settings.moduleswitches) and
  2147. (pi_needs_got in current_procinfo.flags) and
  2148. (tf_pic_uses_got in target_info.flags) then
  2149. begin
  2150. { Procedure parametrs are not initialized at this stage.
  2151. Before GOT initialization code, allocate registers used for procedure parameters
  2152. to prevent usage of these registers for temp operations in later stages of code
  2153. generation. }
  2154. regs:=rg[R_INTREGISTER].used_in_proc;
  2155. for r:=RS_R0 to RS_R3 do
  2156. if r in regs then
  2157. a_reg_alloc(list, newreg(R_INTREGISTER,r,R_SUBWHOLE));
  2158. { Allocate scratch register R12 and use it for GOT calculations directly.
  2159. Otherwise the init code can be distorted in later stages of code generation. }
  2160. a_reg_alloc(list,NR_R12);
  2161. reference_reset(ref,4,[]);
  2162. current_asmdata.getglobaldatalabel(l);
  2163. cg.a_label(current_procinfo.aktlocaldata,l);
  2164. ref.symbol:=l;
  2165. ref.base:=NR_PC;
  2166. ref.symboldata:=current_procinfo.aktlocaldata.last;
  2167. list.concat(Taicpu.op_reg_ref(A_LDR,NR_R12,ref));
  2168. current_asmdata.getaddrlabel(l);
  2169. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_32bit,l,current_asmdata.RefAsmSymbol('_GLOBAL_OFFSET_TABLE_',AT_DATA),-8));
  2170. cg.a_label(list,l);
  2171. list.concat(Taicpu.op_reg_reg_reg(A_ADD,NR_R12,NR_PC,NR_R12));
  2172. list.concat(Taicpu.op_reg_reg(A_MOV,current_procinfo.got,NR_R12));
  2173. { Deallocate registers }
  2174. a_reg_dealloc(list,NR_R12);
  2175. for r:=RS_R3 downto RS_R0 do
  2176. if r in regs then
  2177. a_reg_dealloc(list, newreg(R_INTREGISTER,r,R_SUBWHOLE));
  2178. end;
  2179. end;
  2180. procedure tbasecgarm.a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);
  2181. var
  2182. b : byte;
  2183. tmpref : treference;
  2184. instr : taicpu;
  2185. begin
  2186. if ref.addressmode<>AM_OFFSET then
  2187. internalerror(200309071);
  2188. tmpref:=ref;
  2189. { Be sure to have a base register }
  2190. if (tmpref.base=NR_NO) then
  2191. begin
  2192. if tmpref.shiftmode<>SM_None then
  2193. internalerror(2014020702);
  2194. if tmpref.signindex<0 then
  2195. internalerror(200312023);
  2196. tmpref.base:=tmpref.index;
  2197. tmpref.index:=NR_NO;
  2198. end;
  2199. if assigned(tmpref.symbol) or
  2200. not((is_shifter_const(tmpref.offset,b)) or
  2201. (is_shifter_const(-tmpref.offset,b))
  2202. ) then
  2203. fixref(list,tmpref);
  2204. { expect a base here if there is an index }
  2205. if (tmpref.base=NR_NO) and (tmpref.index<>NR_NO) then
  2206. internalerror(200312022);
  2207. if tmpref.index<>NR_NO then
  2208. begin
  2209. if tmpref.shiftmode<>SM_None then
  2210. internalerror(200312021);
  2211. if tmpref.signindex<0 then
  2212. a_op_reg_reg_reg(list,OP_SUB,OS_ADDR,tmpref.base,tmpref.index,r)
  2213. else
  2214. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpref.base,tmpref.index,r);
  2215. if tmpref.offset<>0 then
  2216. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,r,r);
  2217. end
  2218. else
  2219. begin
  2220. if tmpref.base=NR_NO then
  2221. a_load_const_reg(list,OS_ADDR,tmpref.offset,r)
  2222. else
  2223. if tmpref.offset<>0 then
  2224. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,tmpref.base,r)
  2225. else
  2226. begin
  2227. instr:=taicpu.op_reg_reg(A_MOV,r,tmpref.base);
  2228. list.concat(instr);
  2229. add_move_instruction(instr);
  2230. end;
  2231. end;
  2232. end;
  2233. procedure tbasecgarm.fixref(list : TAsmList;var ref : treference);
  2234. var
  2235. tmpreg, tmpreg2 : tregister;
  2236. tmpref : treference;
  2237. l, piclabel : tasmlabel;
  2238. indirection_done : boolean;
  2239. begin
  2240. { absolute symbols can't be handled directly, we've to store the symbol reference
  2241. in the text segment and access it pc relative
  2242. For now, we assume that references where base or index equals to PC are already
  2243. relative, all other references are assumed to be absolute and thus they need
  2244. to be handled extra.
  2245. A proper solution would be to change refoptions to a set and store the information
  2246. if the symbol is absolute or relative there.
  2247. }
  2248. { create consts entry }
  2249. reference_reset(tmpref,4,[]);
  2250. current_asmdata.getjumplabel(l);
  2251. cg.a_label(current_procinfo.aktlocaldata,l);
  2252. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  2253. piclabel:=nil;
  2254. tmpreg:=NR_NO;
  2255. indirection_done:=false;
  2256. if assigned(ref.symbol) then
  2257. begin
  2258. if (target_info.system=system_arm_darwin) and
  2259. (ref.symbol.bind in [AB_EXTERNAL,AB_WEAK_EXTERNAL,AB_PRIVATE_EXTERN,AB_COMMON]) then
  2260. begin
  2261. tmpreg:=g_indirect_sym_load(list,ref.symbol.name,asmsym2indsymflags(ref.symbol));
  2262. if ref.offset<>0 then
  2263. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2264. indirection_done:=true;
  2265. end
  2266. else if (cs_create_pic in current_settings.moduleswitches) then
  2267. if (tf_pic_uses_got in target_info.flags) then
  2268. current_procinfo.aktlocaldata.concat(tai_const.Create_type_sym(aitconst_got,ref.symbol))
  2269. else
  2270. begin
  2271. { ideally, we would want to generate
  2272. ldr r1, LPICConstPool
  2273. LPICLocal:
  2274. ldr/str r2,[pc,r1]
  2275. ...
  2276. LPICConstPool:
  2277. .long _globsym-(LPICLocal+8)
  2278. However, we cannot be sure that the ldr/str will follow
  2279. right after the call to fixref, so we have to load the
  2280. complete address already in a register.
  2281. }
  2282. current_asmdata.getaddrlabel(piclabel);
  2283. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_ptr,piclabel,ref.symbol,ref.offset-8));
  2284. end
  2285. else
  2286. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset))
  2287. end
  2288. else
  2289. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ref.offset));
  2290. { load consts entry }
  2291. if not indirection_done then
  2292. begin
  2293. tmpreg:=getintregister(list,OS_INT);
  2294. tmpref.symbol:=l;
  2295. tmpref.base:=NR_PC;
  2296. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2297. if (cs_create_pic in current_settings.moduleswitches) and
  2298. (tf_pic_uses_got in target_info.flags) and
  2299. assigned(ref.symbol) then
  2300. begin
  2301. reference_reset(tmpref,4,[]);
  2302. tmpref.base:=current_procinfo.got;
  2303. tmpref.index:=tmpreg;
  2304. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2305. if ref.offset<>0 then
  2306. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2307. end;
  2308. end;
  2309. if assigned(piclabel) then
  2310. begin
  2311. cg.a_label(list,piclabel);
  2312. tmpreg2:=getaddressregister(list);
  2313. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpreg,NR_PC,tmpreg2);
  2314. tmpreg:=tmpreg2
  2315. end;
  2316. { This routine can be called with PC as base/index in case the offset
  2317. was too large to encode in a load/store. In that case, the entire
  2318. absolute expression has been re-encoded in a new constpool entry, and
  2319. we have to remove the use of PC from the original reference (the code
  2320. above made everything relative to the value loaded from the new
  2321. constpool entry) }
  2322. if is_pc(ref.base) then
  2323. ref.base:=NR_NO;
  2324. if is_pc(ref.index) then
  2325. ref.index:=NR_NO;
  2326. if (ref.base<>NR_NO) then
  2327. begin
  2328. if ref.index<>NR_NO then
  2329. begin
  2330. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  2331. ref.base:=tmpreg;
  2332. end
  2333. else
  2334. if ref.base<>NR_PC then
  2335. begin
  2336. ref.index:=tmpreg;
  2337. ref.shiftimm:=0;
  2338. ref.signindex:=1;
  2339. ref.shiftmode:=SM_None;
  2340. end
  2341. else
  2342. ref.base:=tmpreg;
  2343. end
  2344. else
  2345. ref.base:=tmpreg;
  2346. ref.offset:=0;
  2347. ref.symbol:=nil;
  2348. end;
  2349. procedure tbasecgarm.g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  2350. var
  2351. paraloc1,paraloc2,paraloc3 : TCGPara;
  2352. pd : tprocdef;
  2353. begin
  2354. pd:=search_system_proc('MOVE');
  2355. paraloc1.init;
  2356. paraloc2.init;
  2357. paraloc3.init;
  2358. paramanager.getintparaloc(list,pd,1,paraloc1);
  2359. paramanager.getintparaloc(list,pd,2,paraloc2);
  2360. paramanager.getintparaloc(list,pd,3,paraloc3);
  2361. a_load_const_cgpara(list,OS_SINT,len,paraloc3);
  2362. a_loadaddr_ref_cgpara(list,dest,paraloc2);
  2363. a_loadaddr_ref_cgpara(list,source,paraloc1);
  2364. paramanager.freecgpara(list,paraloc3);
  2365. paramanager.freecgpara(list,paraloc2);
  2366. paramanager.freecgpara(list,paraloc1);
  2367. alloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2368. alloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2369. a_call_name(list,'FPC_MOVE',false);
  2370. dealloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2371. dealloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2372. paraloc3.done;
  2373. paraloc2.done;
  2374. paraloc1.done;
  2375. end;
  2376. procedure tbasecgarm.g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  2377. const
  2378. maxtmpreg_arm = 10; {roozbeh: can be reduced to 8 or lower if might conflick with reserved ones,also +2 is used becouse of regs required for referencing}
  2379. maxtmpreg_thumb = 5;
  2380. var
  2381. srcref,dstref,usedtmpref,usedtmpref2:treference;
  2382. srcreg,destreg,countreg,r,tmpreg:tregister;
  2383. helpsize:aint;
  2384. copysize:byte;
  2385. cgsize:Tcgsize;
  2386. tmpregisters:array[1..maxtmpreg_arm] of tregister;
  2387. maxtmpreg,
  2388. tmpregi,tmpregi2:byte;
  2389. { will never be called with count<=4 }
  2390. procedure genloop(count : aword;size : byte);
  2391. const
  2392. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2393. var
  2394. l : tasmlabel;
  2395. begin
  2396. current_asmdata.getjumplabel(l);
  2397. if count<size then size:=1;
  2398. a_load_const_reg(list,OS_INT,count div size,countreg);
  2399. cg.a_label(list,l);
  2400. srcref.addressmode:=AM_POSTINDEXED;
  2401. dstref.addressmode:=AM_POSTINDEXED;
  2402. srcref.offset:=size;
  2403. dstref.offset:=size;
  2404. r:=getintregister(list,size2opsize[size]);
  2405. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2406. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2407. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1),PF_S));
  2408. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2409. a_jmp_flags(list,F_NE,l);
  2410. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2411. srcref.offset:=1;
  2412. dstref.offset:=1;
  2413. case count mod size of
  2414. 1:
  2415. begin
  2416. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2417. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2418. end;
  2419. 2:
  2420. if aligned then
  2421. begin
  2422. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2423. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2424. end
  2425. else
  2426. begin
  2427. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2428. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2429. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2430. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2431. end;
  2432. 3:
  2433. if aligned then
  2434. begin
  2435. srcref.offset:=2;
  2436. dstref.offset:=2;
  2437. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2438. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2439. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2440. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2441. end
  2442. else
  2443. begin
  2444. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2445. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2446. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2447. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2448. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2449. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2450. end;
  2451. end;
  2452. { keep the registers alive }
  2453. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2454. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2455. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2456. end;
  2457. { will never be called with count<=4 }
  2458. procedure genloop_thumb(count : aword;size : byte);
  2459. procedure refincofs(const ref : treference;const value : longint = 1);
  2460. begin
  2461. a_op_const_reg(list,OP_ADD,OS_ADDR,value,ref.base);
  2462. end;
  2463. const
  2464. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2465. var
  2466. l : tasmlabel;
  2467. begin
  2468. current_asmdata.getjumplabel(l);
  2469. if count<size then size:=1;
  2470. a_load_const_reg(list,OS_INT,count div size,countreg);
  2471. cg.a_label(list,l);
  2472. r:=getintregister(list,size2opsize[size]);
  2473. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2474. refincofs(srcref);
  2475. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2476. refincofs(dstref);
  2477. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2478. list.concat(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1));
  2479. a_jmp_flags(list,F_NE,l);
  2480. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2481. case count mod size of
  2482. 1:
  2483. begin
  2484. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2485. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2486. end;
  2487. 2:
  2488. if aligned then
  2489. begin
  2490. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2491. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2492. end
  2493. else
  2494. begin
  2495. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2496. refincofs(srcref);
  2497. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2498. refincofs(dstref);
  2499. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2500. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2501. end;
  2502. 3:
  2503. if aligned then
  2504. begin
  2505. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2506. refincofs(srcref,2);
  2507. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2508. refincofs(dstref,2);
  2509. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2510. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2511. end
  2512. else
  2513. begin
  2514. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2515. refincofs(srcref);
  2516. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2517. refincofs(dstref);
  2518. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2519. refincofs(srcref);
  2520. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2521. refincofs(dstref);
  2522. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2523. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2524. end;
  2525. end;
  2526. { keep the registers alive }
  2527. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2528. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2529. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2530. end;
  2531. begin
  2532. if len=0 then
  2533. exit;
  2534. if GenerateThumbCode then
  2535. maxtmpreg:=maxtmpreg_thumb
  2536. else
  2537. maxtmpreg:=maxtmpreg_arm;
  2538. helpsize:=12+maxtmpreg*4;//52 with maxtmpreg=10
  2539. dstref:=dest;
  2540. srcref:=source;
  2541. if cs_opt_size in current_settings.optimizerswitches then
  2542. helpsize:=8;
  2543. if aligned and (len=4) then
  2544. begin
  2545. tmpreg:=getintregister(list,OS_32);
  2546. a_load_ref_reg(list,OS_32,OS_32,source,tmpreg);
  2547. a_load_reg_ref(list,OS_32,OS_32,tmpreg,dest);
  2548. end
  2549. else if aligned and (len=2) then
  2550. begin
  2551. tmpreg:=getintregister(list,OS_16);
  2552. a_load_ref_reg(list,OS_16,OS_16,source,tmpreg);
  2553. a_load_reg_ref(list,OS_16,OS_16,tmpreg,dest);
  2554. end
  2555. else if (len<=helpsize) and aligned then
  2556. begin
  2557. tmpregi:=0;
  2558. srcreg:=getintregister(list,OS_ADDR);
  2559. { explicit pc relative addressing, could be
  2560. e.g. a floating point constant }
  2561. if source.base=NR_PC then
  2562. begin
  2563. { ... then we don't need a loadaddr }
  2564. srcref:=source;
  2565. end
  2566. else
  2567. begin
  2568. a_loadaddr_ref_reg(list,source,srcreg);
  2569. reference_reset_base(srcref,srcreg,0,source.alignment,source.volatility);
  2570. end;
  2571. while (len div 4 <> 0) and (tmpregi<maxtmpreg) do
  2572. begin
  2573. inc(tmpregi);
  2574. tmpregisters[tmpregi]:=getintregister(list,OS_32);
  2575. a_load_ref_reg(list,OS_32,OS_32,srcref,tmpregisters[tmpregi]);
  2576. inc(srcref.offset,4);
  2577. dec(len,4);
  2578. end;
  2579. destreg:=getintregister(list,OS_ADDR);
  2580. a_loadaddr_ref_reg(list,dest,destreg);
  2581. reference_reset_base(dstref,destreg,0,dest.alignment,dest.volatility);
  2582. tmpregi2:=1;
  2583. while (tmpregi2<=tmpregi) do
  2584. begin
  2585. a_load_reg_ref(list,OS_32,OS_32,tmpregisters[tmpregi2],dstref);
  2586. inc(dstref.offset,4);
  2587. inc(tmpregi2);
  2588. end;
  2589. copysize:=4;
  2590. cgsize:=OS_32;
  2591. while len<>0 do
  2592. begin
  2593. if len<2 then
  2594. begin
  2595. copysize:=1;
  2596. cgsize:=OS_8;
  2597. end
  2598. else if len<4 then
  2599. begin
  2600. copysize:=2;
  2601. cgsize:=OS_16;
  2602. end;
  2603. dec(len,copysize);
  2604. r:=getintregister(list,cgsize);
  2605. a_load_ref_reg(list,cgsize,cgsize,srcref,r);
  2606. a_load_reg_ref(list,cgsize,cgsize,r,dstref);
  2607. inc(srcref.offset,copysize);
  2608. inc(dstref.offset,copysize);
  2609. end;{end of while}
  2610. end
  2611. else
  2612. begin
  2613. cgsize:=OS_32;
  2614. if (len<=4) then{len<=4 and not aligned}
  2615. begin
  2616. r:=getintregister(list,cgsize);
  2617. usedtmpref:=a_internal_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2618. if Len=1 then
  2619. a_load_reg_ref(list,OS_8,OS_8,r,dstref)
  2620. else
  2621. begin
  2622. tmpreg:=getintregister(list,cgsize);
  2623. usedtmpref2:=a_internal_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2624. inc(usedtmpref.offset,1);
  2625. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2626. inc(usedtmpref2.offset,1);
  2627. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2628. if len>2 then
  2629. begin
  2630. inc(usedtmpref.offset,1);
  2631. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2632. inc(usedtmpref2.offset,1);
  2633. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2634. if len>3 then
  2635. begin
  2636. inc(usedtmpref.offset,1);
  2637. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2638. inc(usedtmpref2.offset,1);
  2639. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2640. end;
  2641. end;
  2642. end;
  2643. end{end of if len<=4}
  2644. else
  2645. begin{unaligned & 4<len<helpsize **or** aligned/unaligned & len>helpsize}
  2646. destreg:=getintregister(list,OS_ADDR);
  2647. a_loadaddr_ref_reg(list,dest,destreg);
  2648. reference_reset_base(dstref,destreg,0,dest.alignment,dest.volatility);
  2649. srcreg:=getintregister(list,OS_ADDR);
  2650. a_loadaddr_ref_reg(list,source,srcreg);
  2651. reference_reset_base(srcref,srcreg,0,source.alignment,source.volatility);
  2652. countreg:=getintregister(list,OS_32);
  2653. // if cs_opt_size in current_settings.optimizerswitches then
  2654. { roozbeh : it seems loading 1 byte is faster becouse of caching/fetching(?) }
  2655. {if aligned then
  2656. genloop(len,4)
  2657. else}
  2658. if GenerateThumbCode then
  2659. genloop_thumb(len,1)
  2660. else
  2661. genloop(len,1);
  2662. end;
  2663. end;
  2664. end;
  2665. procedure tbasecgarm.g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);
  2666. begin
  2667. g_concatcopy_internal(list,source,dest,len,false);
  2668. end;
  2669. procedure tbasecgarm.g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);
  2670. begin
  2671. if (source.alignment in [1,3]) or
  2672. (dest.alignment in [1,3]) then
  2673. g_concatcopy_internal(list,source,dest,len,false)
  2674. else
  2675. g_concatcopy_internal(list,source,dest,len,true);
  2676. end;
  2677. procedure tbasecgarm.g_overflowCheck(list : TAsmList;const l : tlocation;def : tdef);
  2678. var
  2679. ovloc : tlocation;
  2680. begin
  2681. ovloc.loc:=LOC_VOID;
  2682. g_overflowCheck_loc(list,l,def,ovloc);
  2683. end;
  2684. procedure tbasecgarm.g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);
  2685. var
  2686. hl : tasmlabel;
  2687. ai:TAiCpu;
  2688. hflags : tresflags;
  2689. begin
  2690. if not(cs_check_overflow in current_settings.localswitches) then
  2691. exit;
  2692. current_asmdata.getjumplabel(hl);
  2693. case ovloc.loc of
  2694. LOC_VOID:
  2695. begin
  2696. ai:=taicpu.op_sym(A_B,hl);
  2697. ai.is_jmp:=true;
  2698. if not((def.typ=pointerdef) or
  2699. ((def.typ=orddef) and
  2700. (torddef(def).ordtype in [u64bit,u16bit,u32bit,u8bit,uchar,
  2701. pasbool8,pasbool16,pasbool32,pasbool64]))) then
  2702. ai.SetCondition(C_VC)
  2703. else
  2704. if TAiCpu(List.Last).opcode in [A_RSB,A_RSC,A_SBC,A_SUB] then
  2705. ai.SetCondition(C_CS)
  2706. else
  2707. ai.SetCondition(C_CC);
  2708. list.concat(ai);
  2709. end;
  2710. LOC_FLAGS:
  2711. begin
  2712. hflags:=ovloc.resflags;
  2713. inverse_flags(hflags);
  2714. cg.a_jmp_flags(list,hflags,hl);
  2715. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2716. end;
  2717. else
  2718. internalerror(200409281);
  2719. end;
  2720. a_call_name(list,'FPC_OVERFLOW',false);
  2721. a_label(list,hl);
  2722. end;
  2723. procedure tbasecgarm.g_save_registers(list : TAsmList);
  2724. begin
  2725. { this work is done in g_proc_entry }
  2726. end;
  2727. procedure tbasecgarm.g_restore_registers(list : TAsmList);
  2728. begin
  2729. { this work is done in g_proc_exit }
  2730. end;
  2731. procedure tbasecgarm.a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  2732. var
  2733. ai : taicpu;
  2734. hlabel : TAsmLabel;
  2735. begin
  2736. if GenerateThumbCode then
  2737. begin
  2738. { the optimizer has to fix this if jump range is sufficient short }
  2739. current_asmdata.getjumplabel(hlabel);
  2740. ai:=Taicpu.Op_sym(A_B,hlabel);
  2741. ai.SetCondition(inverse_cond(OpCmp2AsmCond[cond]));
  2742. ai.is_jmp:=true;
  2743. list.concat(ai);
  2744. a_jmp_always(list,l);
  2745. a_label(list,hlabel);
  2746. end
  2747. else
  2748. begin
  2749. ai:=Taicpu.Op_sym(A_B,l);
  2750. ai.SetCondition(OpCmp2AsmCond[cond]);
  2751. ai.is_jmp:=true;
  2752. list.concat(ai);
  2753. end;
  2754. end;
  2755. function get_scalar_mm_op(fromsize,tosize : tcgsize) : tasmop;
  2756. const
  2757. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of tasmop = (
  2758. (A_VMOV,A_VCVT,A_NONE,A_NONE,A_NONE),
  2759. (A_VCVT,A_VMOV,A_NONE,A_NONE,A_NONE),
  2760. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2761. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2762. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE));
  2763. begin
  2764. result:=convertop[fromsize,tosize];
  2765. if result=A_NONE then
  2766. internalerror(200312205);
  2767. end;
  2768. function get_scalar_mm_prefix(fromsize,tosize : tcgsize) : TOpPostfix;
  2769. const
  2770. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of TOpPostfix = (
  2771. (PF_F32, PF_F32F64,PF_None,PF_None,PF_None),
  2772. (PF_F64F32,PF_F64, PF_None,PF_None,PF_None),
  2773. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2774. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2775. (PF_None, PF_None, PF_None,PF_None,PF_None));
  2776. begin
  2777. result:=convertop[fromsize,tosize];
  2778. end;
  2779. procedure tbasecgarm.a_loadmm_reg_reg(list: tasmlist; fromsize,tosize: tcgsize; reg1,reg2: tregister; shuffle: pmmshuffle);
  2780. var
  2781. instr: taicpu;
  2782. begin
  2783. if (shuffle=nil) or shufflescalar(shuffle) then
  2784. instr:=setoppostfix(taicpu.op_reg_reg(get_scalar_mm_op(tosize,fromsize),reg2,reg1),get_scalar_mm_prefix(tosize,fromsize))
  2785. else
  2786. internalerror(2009112407);
  2787. list.concat(instr);
  2788. case instr.opcode of
  2789. A_VMOV:
  2790. add_move_instruction(instr);
  2791. end;
  2792. end;
  2793. procedure tbasecgarm.a_loadmm_ref_reg(list: tasmlist; fromsize,tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  2794. var
  2795. intreg,
  2796. tmpmmreg : tregister;
  2797. reg64 : tregister64;
  2798. begin
  2799. if assigned(shuffle) and
  2800. not(shufflescalar(shuffle)) then
  2801. internalerror(2009112413);
  2802. case fromsize of
  2803. OS_32,OS_S32:
  2804. begin
  2805. fromsize:=OS_F32;
  2806. { since we are loading an integer, no conversion may be required }
  2807. if (fromsize<>tosize) then
  2808. internalerror(2009112801);
  2809. end;
  2810. OS_64,OS_S64:
  2811. begin
  2812. fromsize:=OS_F64;
  2813. { since we are loading an integer, no conversion may be required }
  2814. if (fromsize<>tosize) then
  2815. internalerror(2009112901);
  2816. end;
  2817. end;
  2818. if (fromsize<>tosize) then
  2819. tmpmmreg:=getmmregister(list,fromsize)
  2820. else
  2821. tmpmmreg:=reg;
  2822. if (ref.alignment in [1,2]) then
  2823. begin
  2824. case fromsize of
  2825. OS_F32:
  2826. begin
  2827. intreg:=getintregister(list,OS_32);
  2828. a_load_ref_reg(list,OS_32,OS_32,ref,intreg);
  2829. a_loadmm_intreg_reg(list,OS_32,OS_F32,intreg,tmpmmreg,mms_movescalar);
  2830. end;
  2831. OS_F64:
  2832. begin
  2833. reg64.reglo:=getintregister(list,OS_32);
  2834. reg64.reghi:=getintregister(list,OS_32);
  2835. cg64.a_load64_ref_reg(list,ref,reg64);
  2836. cg64.a_loadmm_intreg64_reg(list,OS_F64,reg64,tmpmmreg);
  2837. end;
  2838. else
  2839. internalerror(2009112412);
  2840. end;
  2841. end
  2842. else
  2843. begin
  2844. handle_load_store(list,A_VLDR,PF_None,tmpmmreg,ref);
  2845. end;
  2846. if (tmpmmreg<>reg) then
  2847. a_loadmm_reg_reg(list,fromsize,tosize,tmpmmreg,reg,shuffle);
  2848. end;
  2849. procedure tbasecgarm.a_loadmm_reg_ref(list: tasmlist; fromsize,tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  2850. var
  2851. intreg,
  2852. tmpmmreg : tregister;
  2853. reg64 : tregister64;
  2854. begin
  2855. if assigned(shuffle) and
  2856. not(shufflescalar(shuffle)) then
  2857. internalerror(2009112416);
  2858. case tosize of
  2859. OS_32,OS_S32:
  2860. begin
  2861. tosize:=OS_F32;
  2862. { since we are loading an integer, no conversion may be required }
  2863. if (fromsize<>tosize) then
  2864. internalerror(2009112801);
  2865. end;
  2866. OS_64,OS_S64:
  2867. begin
  2868. tosize:=OS_F64;
  2869. { since we are loading an integer, no conversion may be required }
  2870. if (fromsize<>tosize) then
  2871. internalerror(2009112901);
  2872. end;
  2873. end;
  2874. if (fromsize<>tosize) then
  2875. begin
  2876. tmpmmreg:=getmmregister(list,tosize);
  2877. a_loadmm_reg_reg(list,fromsize,tosize,reg,tmpmmreg,shuffle);
  2878. end
  2879. else
  2880. tmpmmreg:=reg;
  2881. if (ref.alignment in [1,2]) then
  2882. begin
  2883. case tosize of
  2884. OS_F32:
  2885. begin
  2886. intreg:=getintregister(list,OS_32);
  2887. a_loadmm_reg_intreg(list,OS_F32,OS_32,tmpmmreg,intreg,shuffle);
  2888. a_load_reg_ref(list,OS_32,OS_32,intreg,ref);
  2889. end;
  2890. OS_F64:
  2891. begin
  2892. reg64.reglo:=getintregister(list,OS_32);
  2893. reg64.reghi:=getintregister(list,OS_32);
  2894. cg64.a_loadmm_reg_intreg64(list,OS_F64,tmpmmreg,reg64);
  2895. cg64.a_load64_reg_ref(list,reg64,ref);
  2896. end;
  2897. else
  2898. internalerror(2009112417);
  2899. end;
  2900. end
  2901. else
  2902. begin
  2903. handle_load_store(list,A_VSTR,PF_None,tmpmmreg,ref);
  2904. end;
  2905. end;
  2906. procedure tbasecgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  2907. begin
  2908. { this code can only be used to transfer raw data, not to perform
  2909. conversions }
  2910. if (tosize<>OS_F32) then
  2911. internalerror(2009112419);
  2912. if not(fromsize in [OS_32,OS_S32]) then
  2913. internalerror(2009112420);
  2914. if assigned(shuffle) and
  2915. not shufflescalar(shuffle) then
  2916. internalerror(2009112516);
  2917. list.concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg));
  2918. end;
  2919. procedure tbasecgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize; mmreg, intreg: tregister;shuffle : pmmshuffle);
  2920. begin
  2921. { this code can only be used to transfer raw data, not to perform
  2922. conversions }
  2923. if (fromsize<>OS_F32) then
  2924. internalerror(2009112430);
  2925. if not(tosize in [OS_32,OS_S32]) then
  2926. internalerror(2009112420);
  2927. if assigned(shuffle) and
  2928. not shufflescalar(shuffle) then
  2929. internalerror(2009112514);
  2930. list.concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg));
  2931. end;
  2932. procedure tbasecgarm.a_opmm_reg_reg(list: tasmlist; op: topcg; size: tcgsize; src, dst: tregister; shuffle: pmmshuffle);
  2933. var
  2934. tmpreg: tregister;
  2935. begin
  2936. { the vfp doesn't support xor nor any other logical operation, but
  2937. this routine is used to initialise global mm regvars. We can
  2938. easily initialise an mm reg with 0 though. }
  2939. case op of
  2940. OP_XOR:
  2941. begin
  2942. if (src<>dst) or
  2943. (reg_cgsize(src)<>size) or
  2944. assigned(shuffle) then
  2945. internalerror(2009112907);
  2946. tmpreg:=getintregister(list,OS_32);
  2947. a_load_const_reg(list,OS_32,0,tmpreg);
  2948. case size of
  2949. OS_F32:
  2950. list.concat(taicpu.op_reg_reg(A_VMOV,dst,tmpreg));
  2951. OS_F64:
  2952. list.concat(taicpu.op_reg_reg_reg(A_VMOV,dst,tmpreg,tmpreg));
  2953. else
  2954. internalerror(2009112908);
  2955. end;
  2956. end
  2957. else
  2958. internalerror(2009112906);
  2959. end;
  2960. end;
  2961. procedure tbasecgarm.maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  2962. const
  2963. overflowops = [OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NEG];
  2964. begin
  2965. if (op in overflowops) and
  2966. (size in [OS_8,OS_S8,OS_16,OS_S16]) then
  2967. a_load_reg_reg(list,OS_32,size,dst,dst);
  2968. end;
  2969. procedure tbasecgarm.safe_mla(list : TAsmList; op1,op2,op3,op4 : TRegister);
  2970. procedure checkreg(var reg : TRegister);
  2971. var
  2972. tmpreg : TRegister;
  2973. begin
  2974. if ((GenerateThumbCode or GenerateThumb2Code) and (getsupreg(reg)=RS_R13)) or
  2975. (getsupreg(reg)=RS_R15) then
  2976. begin
  2977. tmpreg:=getintregister(list,OS_INT);
  2978. a_load_reg_reg(list,OS_INT,OS_INT,reg,tmpreg);
  2979. reg:=tmpreg;
  2980. end;
  2981. end;
  2982. begin
  2983. checkreg(op1);
  2984. checkreg(op2);
  2985. checkreg(op3);
  2986. checkreg(op4);
  2987. list.concat(taicpu.op_reg_reg_reg_reg(A_MLA,op1,op2,op3,op4));
  2988. end;
  2989. procedure tcg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  2990. begin
  2991. case op of
  2992. OP_NEG:
  2993. begin
  2994. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2995. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  2996. list.concat(taicpu.op_reg_reg_const(A_RSC,regdst.reghi,regsrc.reghi,0));
  2997. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2998. end;
  2999. OP_NOT:
  3000. begin
  3001. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  3002. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  3003. end;
  3004. else
  3005. a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);
  3006. end;
  3007. end;
  3008. procedure tcg64farm.a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);
  3009. begin
  3010. a_op64_const_reg_reg(list,op,size,value,reg,reg);
  3011. end;
  3012. procedure tcg64farm.a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);
  3013. var
  3014. ovloc : tlocation;
  3015. begin
  3016. a_op64_const_reg_reg_checkoverflow(list,op,size,value,regsrc,regdst,false,ovloc);
  3017. end;
  3018. procedure tcg64farm.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);
  3019. var
  3020. ovloc : tlocation;
  3021. begin
  3022. a_op64_reg_reg_reg_checkoverflow(list,op,size,regsrc1,regsrc2,regdst,false,ovloc);
  3023. end;
  3024. procedure tcg64farm.a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);
  3025. begin
  3026. { this code can only be used to transfer raw data, not to perform
  3027. conversions }
  3028. if (mmsize<>OS_F64) then
  3029. internalerror(2009112405);
  3030. list.concat(taicpu.op_reg_reg_reg(A_VMOV,mmreg,intreg.reglo,intreg.reghi));
  3031. end;
  3032. procedure tcg64farm.a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);
  3033. begin
  3034. { this code can only be used to transfer raw data, not to perform
  3035. conversions }
  3036. if (mmsize<>OS_F64) then
  3037. internalerror(2009112406);
  3038. list.concat(taicpu.op_reg_reg_reg(A_VMOV,intreg.reglo,intreg.reghi,mmreg));
  3039. end;
  3040. procedure tcg64farm.a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3041. var
  3042. tmpreg : tregister;
  3043. b : byte;
  3044. begin
  3045. ovloc.loc:=LOC_VOID;
  3046. case op of
  3047. OP_NEG,
  3048. OP_NOT :
  3049. internalerror(2012022501);
  3050. end;
  3051. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3052. begin
  3053. case op of
  3054. OP_ADD:
  3055. begin
  3056. if is_shifter_const(lo(value),b) then
  3057. begin
  3058. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3059. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3060. end
  3061. else
  3062. begin
  3063. tmpreg:=cg.getintregister(list,OS_32);
  3064. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3065. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3066. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3067. end;
  3068. if is_shifter_const(hi(value),b) then
  3069. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,hi(value)),PF_S))
  3070. else
  3071. begin
  3072. tmpreg:=cg.getintregister(list,OS_32);
  3073. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3074. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3075. end;
  3076. end;
  3077. OP_SUB:
  3078. begin
  3079. if is_shifter_const(lo(value),b) then
  3080. begin
  3081. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3082. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3083. end
  3084. else
  3085. begin
  3086. tmpreg:=cg.getintregister(list,OS_32);
  3087. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3088. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3089. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3090. end;
  3091. if is_shifter_const(hi(value),b) then
  3092. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))),PF_S))
  3093. else
  3094. begin
  3095. tmpreg:=cg.getintregister(list,OS_32);
  3096. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3097. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3098. end;
  3099. end;
  3100. else
  3101. internalerror(200502131);
  3102. end;
  3103. if size=OS_64 then
  3104. begin
  3105. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3106. ovloc.loc:=LOC_FLAGS;
  3107. case op of
  3108. OP_ADD:
  3109. ovloc.resflags:=F_CS;
  3110. OP_SUB:
  3111. ovloc.resflags:=F_CC;
  3112. end;
  3113. end;
  3114. end
  3115. else
  3116. begin
  3117. case op of
  3118. OP_AND,OP_OR,OP_XOR:
  3119. begin
  3120. cg.a_op_const_reg_reg(list,op,OS_32,aint(lo(value)),regsrc.reglo,regdst.reglo);
  3121. cg.a_op_const_reg_reg(list,op,OS_32,aint(hi(value)),regsrc.reghi,regdst.reghi);
  3122. end;
  3123. OP_ADD:
  3124. begin
  3125. if is_shifter_const(aint(lo(value)),b) then
  3126. begin
  3127. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3128. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3129. end
  3130. else
  3131. begin
  3132. tmpreg:=cg.getintregister(list,OS_32);
  3133. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3134. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3135. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3136. end;
  3137. if is_shifter_const(aint(hi(value)),b) then
  3138. list.concat(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3139. else
  3140. begin
  3141. tmpreg:=cg.getintregister(list,OS_32);
  3142. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  3143. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg));
  3144. end;
  3145. end;
  3146. OP_SUB:
  3147. begin
  3148. if is_shifter_const(aint(lo(value)),b) then
  3149. begin
  3150. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3151. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3152. end
  3153. else
  3154. begin
  3155. tmpreg:=cg.getintregister(list,OS_32);
  3156. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3157. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3158. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3159. end;
  3160. if is_shifter_const(aint(hi(value)),b) then
  3161. list.concat(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3162. else
  3163. begin
  3164. tmpreg:=cg.getintregister(list,OS_32);
  3165. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3166. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg));
  3167. end;
  3168. end;
  3169. else
  3170. internalerror(2003083101);
  3171. end;
  3172. end;
  3173. end;
  3174. procedure tcg64farm.a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3175. begin
  3176. ovloc.loc:=LOC_VOID;
  3177. case op of
  3178. OP_NEG,
  3179. OP_NOT :
  3180. internalerror(2012022502);
  3181. end;
  3182. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3183. begin
  3184. case op of
  3185. OP_ADD:
  3186. begin
  3187. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3188. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3189. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi),PF_S));
  3190. end;
  3191. OP_SUB:
  3192. begin
  3193. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3194. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3195. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi),PF_S));
  3196. end;
  3197. else
  3198. internalerror(2003083101);
  3199. end;
  3200. if size=OS_64 then
  3201. begin
  3202. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3203. ovloc.loc:=LOC_FLAGS;
  3204. case op of
  3205. OP_ADD:
  3206. ovloc.resflags:=F_CS;
  3207. OP_SUB:
  3208. ovloc.resflags:=F_CC;
  3209. end;
  3210. end;
  3211. end
  3212. else
  3213. begin
  3214. case op of
  3215. OP_AND,OP_OR,OP_XOR:
  3216. begin
  3217. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);
  3218. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);
  3219. end;
  3220. OP_ADD:
  3221. begin
  3222. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3223. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3224. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi));
  3225. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3226. end;
  3227. OP_SUB:
  3228. begin
  3229. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3230. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3231. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi));
  3232. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3233. end;
  3234. else
  3235. internalerror(2003083101);
  3236. end;
  3237. end;
  3238. end;
  3239. procedure tthumbcgarm.init_register_allocators;
  3240. begin
  3241. inherited init_register_allocators;
  3242. if assigned(current_procinfo) and (current_procinfo.framepointer=NR_R7) then
  3243. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3244. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6],first_int_imreg,[])
  3245. else
  3246. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3247. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7],first_int_imreg,[]);
  3248. end;
  3249. procedure tthumbcgarm.done_register_allocators;
  3250. begin
  3251. rg[R_INTREGISTER].free;
  3252. rg[R_FPUREGISTER].free;
  3253. rg[R_MMREGISTER].free;
  3254. inherited done_register_allocators;
  3255. end;
  3256. procedure tthumbcgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  3257. var
  3258. ref : treference;
  3259. r : byte;
  3260. regs : tcpuregisterset;
  3261. stackmisalignment : pint;
  3262. registerarea: DWord;
  3263. stack_parameters: Boolean;
  3264. begin
  3265. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3266. LocalSize:=align(LocalSize,4);
  3267. { call instruction does not put anything on the stack }
  3268. stackmisalignment:=0;
  3269. if not(nostackframe) then
  3270. begin
  3271. a_reg_alloc(list,NR_STACK_POINTER_REG);
  3272. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3273. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  3274. { save int registers }
  3275. reference_reset(ref,4,[]);
  3276. ref.index:=NR_STACK_POINTER_REG;
  3277. ref.addressmode:=AM_PREINDEXED;
  3278. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3279. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3280. begin
  3281. //!!!! a_reg_alloc(list,NR_R12);
  3282. //!!!! list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  3283. end;
  3284. { the (old) ARM APCS requires saving both the stack pointer (to
  3285. crawl the stack) and the PC (to identify the function this
  3286. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  3287. and R15 -- still needs updating for EABI and Darwin, they don't
  3288. need that }
  3289. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3290. regs:=regs+[RS_R7,RS_R14]
  3291. else
  3292. // if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  3293. include(regs,RS_R14);
  3294. { safely estimate stack size }
  3295. if localsize+current_settings.alignment.localalignmax+4>508 then
  3296. begin
  3297. include(rg[R_INTREGISTER].used_in_proc,RS_R4);
  3298. include(regs,RS_R4);
  3299. end;
  3300. registerarea:=0;
  3301. if regs<>[] then
  3302. begin
  3303. for r:=RS_R0 to RS_R15 do
  3304. if r in regs then
  3305. inc(registerarea,4);
  3306. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,regs));
  3307. end;
  3308. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3309. if stack_parameters or (LocalSize<>0) or
  3310. ((stackmisalignment<>0) and
  3311. ((pi_do_call in current_procinfo.flags) or
  3312. (po_assembler in current_procinfo.procdef.procoptions))) then
  3313. begin
  3314. { do we access stack parameters?
  3315. if yes, the previously estimated stacksize must be used }
  3316. if stack_parameters then
  3317. begin
  3318. if localsize>tarmprocinfo(current_procinfo).stackframesize then
  3319. begin
  3320. writeln(localsize);
  3321. writeln(tarmprocinfo(current_procinfo).stackframesize);
  3322. internalerror(2013040601);
  3323. end
  3324. else
  3325. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea;
  3326. end
  3327. else
  3328. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3329. if localsize<508 then
  3330. begin
  3331. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  3332. end
  3333. else if localsize<=1016 then
  3334. begin
  3335. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3336. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize-508));
  3337. end
  3338. else
  3339. begin
  3340. a_load_const_reg(list,OS_ADDR,-localsize,NR_R4);
  3341. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R4));
  3342. include(regs,RS_R4);
  3343. //!!!! if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  3344. //!!!! a_reg_alloc(list,NR_R12);
  3345. //!!!! a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  3346. //!!!! list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  3347. //!!!! a_reg_dealloc(list,NR_R12);
  3348. end;
  3349. end;
  3350. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3351. begin
  3352. list.concat(taicpu.op_reg_reg_const(A_ADD,current_procinfo.framepointer,NR_STACK_POINTER_REG,0));
  3353. end;
  3354. end;
  3355. end;
  3356. procedure tthumbcgarm.g_proc_exit(list: TAsmList; parasize: longint; nostackframe: boolean);
  3357. var
  3358. LocalSize : longint;
  3359. r: byte;
  3360. regs : tcpuregisterset;
  3361. registerarea : DWord;
  3362. stackmisalignment: pint;
  3363. stack_parameters : Boolean;
  3364. begin
  3365. if not(nostackframe) then
  3366. begin
  3367. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3368. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3369. include(regs,RS_R15);
  3370. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3371. include(regs,getsupreg(current_procinfo.framepointer));
  3372. registerarea:=0;
  3373. for r:=RS_R0 to RS_R15 do
  3374. if r in regs then
  3375. inc(registerarea,4);
  3376. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3377. LocalSize:=current_procinfo.calc_stackframe_size;
  3378. if stack_parameters then
  3379. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea
  3380. else
  3381. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3382. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  3383. (target_info.system in systems_darwin) then
  3384. begin
  3385. if (LocalSize<>0) or
  3386. ((stackmisalignment<>0) and
  3387. ((pi_do_call in current_procinfo.flags) or
  3388. (po_assembler in current_procinfo.procdef.procoptions))) then
  3389. begin
  3390. if LocalSize=0 then
  3391. else if LocalSize<=508 then
  3392. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  3393. else if LocalSize<=1016 then
  3394. begin
  3395. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3396. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,localsize-508));
  3397. end
  3398. else
  3399. begin
  3400. a_reg_alloc(list,NR_R3);
  3401. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R3);
  3402. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R3));
  3403. a_reg_dealloc(list,NR_R3);
  3404. end;
  3405. end;
  3406. if regs=[] then
  3407. begin
  3408. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3409. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3410. else
  3411. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3412. end
  3413. else
  3414. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,regs));
  3415. end;
  3416. end
  3417. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3418. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3419. else
  3420. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3421. end;
  3422. procedure tthumbcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3423. var
  3424. oppostfix:toppostfix;
  3425. usedtmpref: treference;
  3426. tmpreg,tmpreg2 : tregister;
  3427. dir : integer;
  3428. begin
  3429. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3430. FromSize := ToSize;
  3431. case FromSize of
  3432. { signed integer registers }
  3433. OS_8:
  3434. oppostfix:=PF_B;
  3435. OS_S8:
  3436. oppostfix:=PF_SB;
  3437. OS_16:
  3438. oppostfix:=PF_H;
  3439. OS_S16:
  3440. oppostfix:=PF_SH;
  3441. OS_32,
  3442. OS_S32:
  3443. oppostfix:=PF_None;
  3444. else
  3445. InternalError(200308298);
  3446. end;
  3447. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3448. begin
  3449. if target_info.endian=endian_big then
  3450. dir:=-1
  3451. else
  3452. dir:=1;
  3453. case FromSize of
  3454. OS_16,OS_S16:
  3455. begin
  3456. { only complicated references need an extra loadaddr }
  3457. if assigned(ref.symbol) or
  3458. (ref.index<>NR_NO) or
  3459. (ref.offset<-124) or
  3460. (ref.offset>124) or
  3461. { sometimes the compiler reused registers }
  3462. (reg=ref.index) or
  3463. (reg=ref.base) then
  3464. begin
  3465. tmpreg2:=getintregister(list,OS_INT);
  3466. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3467. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment,ref.volatility);
  3468. end
  3469. else
  3470. usedtmpref:=ref;
  3471. if target_info.endian=endian_big then
  3472. inc(usedtmpref.offset,1);
  3473. tmpreg:=getintregister(list,OS_INT);
  3474. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3475. inc(usedtmpref.offset,dir);
  3476. if FromSize=OS_16 then
  3477. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3478. else
  3479. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3480. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3481. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3482. end;
  3483. OS_32,OS_S32:
  3484. begin
  3485. tmpreg:=getintregister(list,OS_INT);
  3486. { only complicated references need an extra loadaddr }
  3487. if assigned(ref.symbol) or
  3488. (ref.index<>NR_NO) or
  3489. (ref.offset<-124) or
  3490. (ref.offset>124) or
  3491. { sometimes the compiler reused registers }
  3492. (reg=ref.index) or
  3493. (reg=ref.base) then
  3494. begin
  3495. tmpreg2:=getintregister(list,OS_INT);
  3496. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3497. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment,ref.volatility);
  3498. end
  3499. else
  3500. usedtmpref:=ref;
  3501. if ref.alignment=2 then
  3502. begin
  3503. if target_info.endian=endian_big then
  3504. inc(usedtmpref.offset,2);
  3505. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  3506. inc(usedtmpref.offset,dir*2);
  3507. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  3508. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3509. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3510. end
  3511. else
  3512. begin
  3513. if target_info.endian=endian_big then
  3514. inc(usedtmpref.offset,3);
  3515. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3516. inc(usedtmpref.offset,dir);
  3517. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3518. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3519. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3520. inc(usedtmpref.offset,dir);
  3521. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3522. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3523. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3524. inc(usedtmpref.offset,dir);
  3525. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3526. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,24));
  3527. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3528. end;
  3529. end
  3530. else
  3531. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3532. end;
  3533. end
  3534. else
  3535. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3536. if (fromsize=OS_S8) and (tosize = OS_16) then
  3537. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  3538. end;
  3539. procedure tthumbcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3540. var
  3541. l : tasmlabel;
  3542. hr : treference;
  3543. begin
  3544. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3545. internalerror(2002090902);
  3546. if is_thumb_imm(a) then
  3547. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3548. else
  3549. begin
  3550. reference_reset(hr,4,[]);
  3551. current_asmdata.getjumplabel(l);
  3552. cg.a_label(current_procinfo.aktlocaldata,l);
  3553. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3554. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3555. hr.symbol:=l;
  3556. hr.base:=NR_PC;
  3557. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3558. end;
  3559. end;
  3560. procedure tthumbcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  3561. var
  3562. hsym : tsym;
  3563. href,
  3564. tmpref : treference;
  3565. paraloc : Pcgparalocation;
  3566. l : TAsmLabel;
  3567. begin
  3568. { calculate the parameter info for the procdef }
  3569. procdef.init_paraloc_info(callerside);
  3570. hsym:=tsym(procdef.parast.Find('self'));
  3571. if not(assigned(hsym) and
  3572. (hsym.typ=paravarsym)) then
  3573. internalerror(200305251);
  3574. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  3575. while paraloc<>nil do
  3576. with paraloc^ do
  3577. begin
  3578. case loc of
  3579. LOC_REGISTER:
  3580. begin
  3581. if is_thumb_imm(ioffset) then
  3582. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  3583. else
  3584. begin
  3585. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3586. reference_reset(tmpref,4,[]);
  3587. current_asmdata.getjumplabel(l);
  3588. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3589. cg.a_label(current_procinfo.aktlocaldata,l);
  3590. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3591. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3592. tmpref.symbol:=l;
  3593. tmpref.base:=NR_PC;
  3594. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3595. a_op_reg_reg(list,OP_SUB,size,NR_R4,register);
  3596. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3597. end;
  3598. end;
  3599. LOC_REFERENCE:
  3600. begin
  3601. { offset in the wrapper needs to be adjusted for the stored
  3602. return address }
  3603. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),sizeof(pint),[]);
  3604. if is_thumb_imm(ioffset) then
  3605. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  3606. else
  3607. begin
  3608. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3609. reference_reset(tmpref,4,[]);
  3610. current_asmdata.getjumplabel(l);
  3611. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3612. cg.a_label(current_procinfo.aktlocaldata,l);
  3613. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3614. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3615. tmpref.symbol:=l;
  3616. tmpref.base:=NR_PC;
  3617. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3618. a_op_reg_ref(list,OP_SUB,size,NR_R4,href);
  3619. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3620. end;
  3621. end
  3622. else
  3623. internalerror(200309189);
  3624. end;
  3625. paraloc:=next;
  3626. end;
  3627. end;
  3628. function tthumbcgarm.handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference;
  3629. var
  3630. href : treference;
  3631. tmpreg : TRegister;
  3632. begin
  3633. href:=ref;
  3634. if { LDR/STR limitations }
  3635. (
  3636. (((op=A_LDR) and (oppostfix=PF_None)) or
  3637. ((op=A_STR) and (oppostfix=PF_None))) and
  3638. (ref.base<>NR_STACK_POINTER_REG) and
  3639. (abs(ref.offset)>124)
  3640. ) or
  3641. { LDRB/STRB limitations }
  3642. (
  3643. (((op=A_LDR) and (oppostfix=PF_B)) or
  3644. ((op=A_LDRB) and (oppostfix=PF_None)) or
  3645. ((op=A_STR) and (oppostfix=PF_B)) or
  3646. ((op=A_STRB) and (oppostfix=PF_None))) and
  3647. ((ref.base=NR_STACK_POINTER_REG) or
  3648. (ref.index=NR_STACK_POINTER_REG) or
  3649. (abs(ref.offset)>31)
  3650. )
  3651. ) or
  3652. { LDRH/STRH limitations }
  3653. (
  3654. (((op=A_LDR) and (oppostfix=PF_H)) or
  3655. ((op=A_LDRH) and (oppostfix=PF_None)) or
  3656. ((op=A_STR) and (oppostfix=PF_H)) or
  3657. ((op=A_STRH) and (oppostfix=PF_None))) and
  3658. ((ref.base=NR_STACK_POINTER_REG) or
  3659. (ref.index=NR_STACK_POINTER_REG) or
  3660. (abs(ref.offset)>62) or
  3661. ((abs(ref.offset) mod 2)<>0)
  3662. )
  3663. ) then
  3664. begin
  3665. tmpreg:=getintregister(list,OS_ADDR);
  3666. a_loadaddr_ref_reg(list,ref,tmpreg);
  3667. reference_reset_base(href,tmpreg,0,ref.alignment,ref.volatility);
  3668. end
  3669. else if (op=A_LDR) and
  3670. (oppostfix in [PF_None]) and
  3671. (ref.base=NR_STACK_POINTER_REG) and
  3672. (abs(ref.offset)>1020) then
  3673. begin
  3674. tmpreg:=getintregister(list,OS_ADDR);
  3675. a_loadaddr_ref_reg(list,ref,tmpreg);
  3676. reference_reset_base(href,tmpreg,0,ref.alignment,ref.volatility);
  3677. end
  3678. else if (op=A_LDR) and
  3679. ((oppostfix in [PF_SH,PF_SB]) or
  3680. (abs(ref.offset)>124)) then
  3681. begin
  3682. tmpreg:=getintregister(list,OS_ADDR);
  3683. a_loadaddr_ref_reg(list,ref,tmpreg);
  3684. reference_reset_base(href,tmpreg,0,ref.alignment,ref.volatility);
  3685. end;
  3686. Result:=inherited handle_load_store(list, op, oppostfix, reg, href);
  3687. end;
  3688. procedure tthumbcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  3689. var
  3690. tmpreg : tregister;
  3691. begin
  3692. case op of
  3693. OP_NEG:
  3694. list.concat(taicpu.op_reg_reg(A_NEG,dst,src));
  3695. OP_NOT:
  3696. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  3697. OP_DIV,OP_IDIV:
  3698. internalerror(200308284);
  3699. OP_ROL:
  3700. begin
  3701. if not(size in [OS_32,OS_S32]) then
  3702. internalerror(2008072801);
  3703. { simulate ROL by ror'ing 32-value }
  3704. tmpreg:=getintregister(list,OS_32);
  3705. a_load_const_reg(list,OS_32,32,tmpreg);
  3706. list.concat(taicpu.op_reg_reg(A_SUB,tmpreg,src));
  3707. list.concat(taicpu.op_reg_reg(A_ROR,dst,src));
  3708. end;
  3709. else
  3710. begin
  3711. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3712. list.concat(setoppostfix(
  3713. taicpu.op_reg_reg(op_reg_opcg2asmop[op],dst,src),op_reg_postfix[op]));
  3714. end;
  3715. end;
  3716. maybeadjustresult(list,op,size,dst);
  3717. end;
  3718. procedure tthumbcgarm.a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);
  3719. var
  3720. tmpreg : tregister;
  3721. {$ifdef DUMMY}
  3722. l1 : longint;
  3723. {$endif DUMMY}
  3724. begin
  3725. //!!! ovloc.loc:=LOC_VOID;
  3726. if {$ifopt R+}(a<>-2147483648) and{$endif} {!!!!!! not setflags and } is_thumb_imm(-a) then
  3727. case op of
  3728. OP_ADD:
  3729. begin
  3730. op:=OP_SUB;
  3731. a:=aint(dword(-a));
  3732. end;
  3733. OP_SUB:
  3734. begin
  3735. op:=OP_ADD;
  3736. a:=aint(dword(-a));
  3737. end
  3738. end;
  3739. if is_thumb_imm(a) and (op in [OP_ADD,OP_SUB]) then
  3740. begin
  3741. // if cgsetflags or setflags then
  3742. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3743. list.concat(setoppostfix(
  3744. taicpu.op_reg_const(op_reg_opcg2asmop[op],dst,a),op_reg_postfix[op]));
  3745. if (cgsetflags {!!! or setflags }) and (size in [OS_8,OS_16,OS_32]) then
  3746. begin
  3747. //!!! ovloc.loc:=LOC_FLAGS;
  3748. case op of
  3749. OP_ADD:
  3750. //!!! ovloc.resflags:=F_CS;
  3751. ;
  3752. OP_SUB:
  3753. //!!! ovloc.resflags:=F_CC;
  3754. ;
  3755. end;
  3756. end;
  3757. end
  3758. else
  3759. begin
  3760. { there could be added some more sophisticated optimizations }
  3761. if (op in [OP_MUL,OP_IMUL,OP_DIV,OP_IDIV]) and (a=1) then
  3762. a_load_reg_reg(list,size,size,dst,dst)
  3763. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  3764. a_load_const_reg(list,size,0,dst)
  3765. else if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  3766. a_op_reg_reg(list,OP_NEG,size,dst,dst)
  3767. { we do this here instead in the peephole optimizer because
  3768. it saves us a register }
  3769. {$ifdef DUMMY}
  3770. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  3771. a_op_const_reg_reg(list,OP_SHL,size,l1,dst,dst)
  3772. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  3773. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  3774. begin
  3775. if l1>32 then{roozbeh does this ever happen?}
  3776. internalerror(200308296);
  3777. shifterop_reset(so);
  3778. so.shiftmode:=SM_LSL;
  3779. so.shiftimm:=l1;
  3780. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,dst,so));
  3781. end
  3782. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  3783. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  3784. begin
  3785. if l1>32 then{does this ever happen?}
  3786. internalerror(201205181);
  3787. shifterop_reset(so);
  3788. so.shiftmode:=SM_LSL;
  3789. so.shiftimm:=l1;
  3790. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,dst,dst,so));
  3791. end
  3792. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,dst,dst) then
  3793. begin
  3794. { nothing to do on success }
  3795. end
  3796. {$endif DUMMY}
  3797. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  3798. Just using mov x, #0 might allow some easier optimizations down the line. }
  3799. else if (op = OP_AND) and (dword(a)=0) then
  3800. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  3801. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  3802. else if (op = OP_AND) and (not(dword(a))=0) then
  3803. // do nothing
  3804. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  3805. broader range of shifterconstants.}
  3806. {$ifdef DUMMY}
  3807. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  3808. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,not(dword(a))))
  3809. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  3810. begin
  3811. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm1));
  3812. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  3813. end
  3814. else if (op in [OP_ADD, OP_SUB, OP_OR]) and
  3815. not(cgsetflags or setflags) and
  3816. split_into_shifter_const(a, imm1, imm2) then
  3817. begin
  3818. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm1));
  3819. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  3820. end
  3821. {$endif DUMMY}
  3822. else if (op in [OP_SHL, OP_SHR, OP_SAR]) then
  3823. begin
  3824. list.concat(taicpu.op_reg_reg_const(op_reg_opcg2asmop[op],dst,dst,a));
  3825. end
  3826. else
  3827. begin
  3828. tmpreg:=getintregister(list,size);
  3829. a_load_const_reg(list,size,a,tmpreg);
  3830. a_op_reg_reg(list,op,size,tmpreg,dst);
  3831. end;
  3832. end;
  3833. maybeadjustresult(list,op,size,dst);
  3834. end;
  3835. procedure tthumbcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister);
  3836. begin
  3837. if (op=OP_ADD) and (src=NR_R13) and (dst<>NR_R13) and ((a mod 4)=0) and (a>0) and (a<=1020) then
  3838. list.concat(taicpu.op_reg_reg_const(A_ADD,dst,src,a))
  3839. else
  3840. inherited a_op_const_reg_reg(list,op,size,a,src,dst);
  3841. end;
  3842. procedure tthumbcgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  3843. var
  3844. l1,l2 : tasmlabel;
  3845. ai : taicpu;
  3846. begin
  3847. current_asmdata.getjumplabel(l1);
  3848. current_asmdata.getjumplabel(l2);
  3849. ai:=setcondition(taicpu.op_sym(A_B,l1),flags_to_cond(f));
  3850. ai.is_jmp:=true;
  3851. list.concat(ai);
  3852. list.concat(taicpu.op_reg_const(A_MOV,reg,0));
  3853. list.concat(taicpu.op_sym(A_B,l2));
  3854. cg.a_label(list,l1);
  3855. list.concat(taicpu.op_reg_const(A_MOV,reg,1));
  3856. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3857. cg.a_label(list,l2);
  3858. end;
  3859. procedure tthumb2cgarm.init_register_allocators;
  3860. begin
  3861. inherited init_register_allocators;
  3862. { currently, we save R14 always, so we can use it }
  3863. if (target_info.system<>system_arm_darwin) then
  3864. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3865. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3866. RS_R9,RS_R10,RS_R12,RS_R14],first_int_imreg,[])
  3867. else
  3868. { r9 is not available on Darwin according to the llvm code generator }
  3869. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3870. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3871. RS_R10,RS_R12,RS_R14],first_int_imreg,[]);
  3872. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  3873. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  3874. if current_settings.fputype in [fpu_vfpv3,fpu_vfpv4] then
  3875. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3876. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3877. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  3878. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3879. ],first_mm_imreg,[])
  3880. else if current_settings.fputype in [fpu_fpv4_s16,fpu_vfpv3_d16] then
  3881. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3882. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3883. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3884. ],first_mm_imreg,[])
  3885. else
  3886. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBNONE,
  3887. [RS_S0,RS_S1,RS_R2,RS_R3,RS_R4,RS_S31],first_mm_imreg,[]);
  3888. end;
  3889. procedure tthumb2cgarm.done_register_allocators;
  3890. begin
  3891. rg[R_INTREGISTER].free;
  3892. rg[R_FPUREGISTER].free;
  3893. rg[R_MMREGISTER].free;
  3894. inherited done_register_allocators;
  3895. end;
  3896. procedure tthumb2cgarm.a_call_reg(list : TAsmList;reg: tregister);
  3897. begin
  3898. list.concat(taicpu.op_reg(A_BLX, reg));
  3899. {
  3900. the compiler does not properly set this flag anymore in pass 1, and
  3901. for now we only need it after pass 2 (I hope) (JM)
  3902. if not(pi_do_call in current_procinfo.flags) then
  3903. internalerror(2003060703);
  3904. }
  3905. include(current_procinfo.flags,pi_do_call);
  3906. end;
  3907. procedure tthumb2cgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3908. var
  3909. l : tasmlabel;
  3910. hr : treference;
  3911. begin
  3912. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3913. internalerror(2002090902);
  3914. if is_thumb32_imm(a) then
  3915. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3916. else if is_thumb32_imm(not(a)) then
  3917. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  3918. else if (a and $FFFF)=a then
  3919. list.concat(taicpu.op_reg_const(A_MOVW,reg,a))
  3920. else
  3921. begin
  3922. reference_reset(hr,4,[]);
  3923. current_asmdata.getjumplabel(l);
  3924. cg.a_label(current_procinfo.aktlocaldata,l);
  3925. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3926. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3927. hr.symbol:=l;
  3928. hr.base:=NR_PC;
  3929. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3930. end;
  3931. end;
  3932. procedure tthumb2cgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3933. var
  3934. oppostfix:toppostfix;
  3935. usedtmpref: treference;
  3936. tmpreg,tmpreg2 : tregister;
  3937. so : tshifterop;
  3938. dir : integer;
  3939. begin
  3940. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3941. FromSize := ToSize;
  3942. case FromSize of
  3943. { signed integer registers }
  3944. OS_8:
  3945. oppostfix:=PF_B;
  3946. OS_S8:
  3947. oppostfix:=PF_SB;
  3948. OS_16:
  3949. oppostfix:=PF_H;
  3950. OS_S16:
  3951. oppostfix:=PF_SH;
  3952. OS_32,
  3953. OS_S32:
  3954. oppostfix:=PF_None;
  3955. else
  3956. InternalError(200308299);
  3957. end;
  3958. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3959. begin
  3960. if target_info.endian=endian_big then
  3961. dir:=-1
  3962. else
  3963. dir:=1;
  3964. case FromSize of
  3965. OS_16,OS_S16:
  3966. begin
  3967. { only complicated references need an extra loadaddr }
  3968. if assigned(ref.symbol) or
  3969. (ref.index<>NR_NO) or
  3970. (ref.offset<-255) or
  3971. (ref.offset>4094) or
  3972. { sometimes the compiler reused registers }
  3973. (reg=ref.index) or
  3974. (reg=ref.base) then
  3975. begin
  3976. tmpreg2:=getintregister(list,OS_INT);
  3977. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3978. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment,ref.volatility);
  3979. end
  3980. else
  3981. usedtmpref:=ref;
  3982. if target_info.endian=endian_big then
  3983. inc(usedtmpref.offset,1);
  3984. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  3985. tmpreg:=getintregister(list,OS_INT);
  3986. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3987. inc(usedtmpref.offset,dir);
  3988. if FromSize=OS_16 then
  3989. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3990. else
  3991. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3992. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  3993. end;
  3994. OS_32,OS_S32:
  3995. begin
  3996. tmpreg:=getintregister(list,OS_INT);
  3997. { only complicated references need an extra loadaddr }
  3998. if assigned(ref.symbol) or
  3999. (ref.index<>NR_NO) or
  4000. (ref.offset<-255) or
  4001. (ref.offset>4092) or
  4002. { sometimes the compiler reused registers }
  4003. (reg=ref.index) or
  4004. (reg=ref.base) then
  4005. begin
  4006. tmpreg2:=getintregister(list,OS_INT);
  4007. a_loadaddr_ref_reg(list,ref,tmpreg2);
  4008. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment,ref.volatility);
  4009. end
  4010. else
  4011. usedtmpref:=ref;
  4012. shifterop_reset(so);so.shiftmode:=SM_LSL;
  4013. if ref.alignment=2 then
  4014. begin
  4015. if target_info.endian=endian_big then
  4016. inc(usedtmpref.offset,2);
  4017. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  4018. inc(usedtmpref.offset,dir*2);
  4019. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  4020. so.shiftimm:=16;
  4021. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4022. end
  4023. else
  4024. begin
  4025. if target_info.endian=endian_big then
  4026. inc(usedtmpref.offset,3);
  4027. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  4028. inc(usedtmpref.offset,dir);
  4029. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4030. so.shiftimm:=8;
  4031. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4032. inc(usedtmpref.offset,dir);
  4033. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4034. so.shiftimm:=16;
  4035. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4036. inc(usedtmpref.offset,dir);
  4037. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4038. so.shiftimm:=24;
  4039. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4040. end;
  4041. end
  4042. else
  4043. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4044. end;
  4045. end
  4046. else
  4047. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4048. if (fromsize=OS_S8) and (tosize = OS_16) then
  4049. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  4050. end;
  4051. procedure tthumb2cgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  4052. begin
  4053. if op = OP_NOT then
  4054. begin
  4055. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  4056. case size of
  4057. OS_8: list.concat(taicpu.op_reg_reg(A_UXTB,dst,dst));
  4058. OS_S8: list.concat(taicpu.op_reg_reg(A_SXTB,dst,dst));
  4059. OS_16: list.concat(taicpu.op_reg_reg(A_UXTH,dst,dst));
  4060. OS_S16: list.concat(taicpu.op_reg_reg(A_SXTH,dst,dst));
  4061. end;
  4062. end
  4063. else
  4064. inherited a_op_reg_reg(list, op, size, src, dst);
  4065. end;
  4066. procedure tthumb2cgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4067. var
  4068. shift, width : byte;
  4069. tmpreg : tregister;
  4070. so : tshifterop;
  4071. l1 : longint;
  4072. begin
  4073. ovloc.loc:=LOC_VOID;
  4074. if {$ifopt R+}(a<>-2147483648) and{$endif} is_shifter_const(-a,shift) then
  4075. case op of
  4076. OP_ADD:
  4077. begin
  4078. op:=OP_SUB;
  4079. a:=aint(dword(-a));
  4080. end;
  4081. OP_SUB:
  4082. begin
  4083. op:=OP_ADD;
  4084. a:=aint(dword(-a));
  4085. end
  4086. end;
  4087. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  4088. case op of
  4089. OP_NEG,OP_NOT,
  4090. OP_DIV,OP_IDIV:
  4091. internalerror(200308285);
  4092. OP_SHL:
  4093. begin
  4094. if a>32 then
  4095. internalerror(2014020703);
  4096. if a<>0 then
  4097. begin
  4098. shifterop_reset(so);
  4099. so.shiftmode:=SM_LSL;
  4100. so.shiftimm:=a;
  4101. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4102. end
  4103. else
  4104. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4105. end;
  4106. OP_ROL:
  4107. begin
  4108. if a>32 then
  4109. internalerror(2014020704);
  4110. if a<>0 then
  4111. begin
  4112. shifterop_reset(so);
  4113. so.shiftmode:=SM_ROR;
  4114. so.shiftimm:=32-a;
  4115. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4116. end
  4117. else
  4118. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4119. end;
  4120. OP_ROR:
  4121. begin
  4122. if a>32 then
  4123. internalerror(2014020705);
  4124. if a<>0 then
  4125. begin
  4126. shifterop_reset(so);
  4127. so.shiftmode:=SM_ROR;
  4128. so.shiftimm:=a;
  4129. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4130. end
  4131. else
  4132. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4133. end;
  4134. OP_SHR:
  4135. begin
  4136. if a>32 then
  4137. internalerror(200308292);
  4138. shifterop_reset(so);
  4139. if a<>0 then
  4140. begin
  4141. so.shiftmode:=SM_LSR;
  4142. so.shiftimm:=a;
  4143. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4144. end
  4145. else
  4146. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4147. end;
  4148. OP_SAR:
  4149. begin
  4150. if a>32 then
  4151. internalerror(200308295);
  4152. if a<>0 then
  4153. begin
  4154. shifterop_reset(so);
  4155. so.shiftmode:=SM_ASR;
  4156. so.shiftimm:=a;
  4157. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4158. end
  4159. else
  4160. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4161. end;
  4162. else
  4163. if (op in [OP_SUB, OP_ADD]) and
  4164. ((a < 0) or
  4165. (a > 4095)) then
  4166. begin
  4167. tmpreg:=getintregister(list,size);
  4168. a_load_const_reg(list, size, a, tmpreg);
  4169. if cgsetflags or setflags then
  4170. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4171. list.concat(setoppostfix(
  4172. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4173. end
  4174. else
  4175. begin
  4176. if cgsetflags or setflags then
  4177. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4178. list.concat(setoppostfix(
  4179. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4180. end;
  4181. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  4182. begin
  4183. ovloc.loc:=LOC_FLAGS;
  4184. case op of
  4185. OP_ADD:
  4186. ovloc.resflags:=F_CS;
  4187. OP_SUB:
  4188. ovloc.resflags:=F_CC;
  4189. end;
  4190. end;
  4191. end
  4192. else
  4193. begin
  4194. { there could be added some more sophisticated optimizations }
  4195. if (op in [OP_MUL,OP_IMUL]) and (a=1) then
  4196. a_load_reg_reg(list,size,size,src,dst)
  4197. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  4198. a_load_const_reg(list,size,0,dst)
  4199. else if (op in [OP_IMUL]) and (a=-1) then
  4200. a_op_reg_reg(list,OP_NEG,size,src,dst)
  4201. { we do this here instead in the peephole optimizer because
  4202. it saves us a register }
  4203. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  4204. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  4205. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  4206. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  4207. begin
  4208. if l1>32 then{roozbeh does this ever happen?}
  4209. internalerror(200308296);
  4210. shifterop_reset(so);
  4211. so.shiftmode:=SM_LSL;
  4212. so.shiftimm:=l1;
  4213. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  4214. end
  4215. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  4216. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  4217. begin
  4218. if l1>32 then{does this ever happen?}
  4219. internalerror(201205181);
  4220. shifterop_reset(so);
  4221. so.shiftmode:=SM_LSL;
  4222. so.shiftimm:=l1;
  4223. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  4224. end
  4225. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  4226. begin
  4227. { nothing to do on success }
  4228. end
  4229. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  4230. Just using mov x, #0 might allow some easier optimizations down the line. }
  4231. else if (op = OP_AND) and (dword(a)=0) then
  4232. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  4233. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  4234. else if (op = OP_AND) and (not(dword(a))=0) then
  4235. list.concat(taicpu.op_reg_reg(A_MOV,dst,src))
  4236. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  4237. broader range of shifterconstants.}
  4238. {else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  4239. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))}
  4240. else if (op = OP_AND) and is_thumb32_imm(a) then
  4241. list.concat(taicpu.op_reg_reg_const(A_AND,dst,src,dword(a)))
  4242. else if (op = OP_AND) and (a = $FFFF) then
  4243. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  4244. else if (op = OP_AND) and is_thumb32_imm(not(dword(a))) then
  4245. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  4246. else if (op = OP_AND) and is_continuous_mask(not(a), shift, width) then
  4247. begin
  4248. a_load_reg_reg(list,size,size,src,dst);
  4249. list.concat(taicpu.op_reg_const_const(A_BFC,dst,shift,width))
  4250. end
  4251. else
  4252. begin
  4253. tmpreg:=getintregister(list,size);
  4254. a_load_const_reg(list,size,a,tmpreg);
  4255. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  4256. end;
  4257. end;
  4258. maybeadjustresult(list,op,size,dst);
  4259. end;
  4260. const
  4261. op_reg_reg_opcg2asmopThumb2: array[TOpCG] of tasmop =
  4262. (A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NONE,A_MVN,A_ORR,
  4263. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  4264. procedure tthumb2cgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4265. var
  4266. so : tshifterop;
  4267. tmpreg,overflowreg : tregister;
  4268. asmop : tasmop;
  4269. begin
  4270. ovloc.loc:=LOC_VOID;
  4271. case op of
  4272. OP_NEG,OP_NOT:
  4273. internalerror(200308286);
  4274. OP_ROL:
  4275. begin
  4276. if not(size in [OS_32,OS_S32]) then
  4277. internalerror(2008072801);
  4278. { simulate ROL by ror'ing 32-value }
  4279. tmpreg:=getintregister(list,OS_32);
  4280. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,32));
  4281. list.concat(taicpu.op_reg_reg_reg(A_SUB,src1,tmpreg,src1));
  4282. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4283. end;
  4284. OP_ROR:
  4285. begin
  4286. if not(size in [OS_32,OS_S32]) then
  4287. internalerror(2008072802);
  4288. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4289. end;
  4290. OP_IMUL,
  4291. OP_MUL:
  4292. begin
  4293. if cgsetflags or setflags then
  4294. begin
  4295. overflowreg:=getintregister(list,size);
  4296. if op=OP_IMUL then
  4297. asmop:=A_SMULL
  4298. else
  4299. asmop:=A_UMULL;
  4300. { the arm doesn't allow that rd and rm are the same }
  4301. if dst=src2 then
  4302. begin
  4303. if dst<>src1 then
  4304. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  4305. else
  4306. begin
  4307. tmpreg:=getintregister(list,size);
  4308. a_load_reg_reg(list,size,size,src2,dst);
  4309. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  4310. end;
  4311. end
  4312. else
  4313. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  4314. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4315. if op=OP_IMUL then
  4316. begin
  4317. shifterop_reset(so);
  4318. so.shiftmode:=SM_ASR;
  4319. so.shiftimm:=31;
  4320. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  4321. end
  4322. else
  4323. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  4324. ovloc.loc:=LOC_FLAGS;
  4325. ovloc.resflags:=F_NE;
  4326. end
  4327. else
  4328. begin
  4329. { the arm doesn't allow that rd and rm are the same }
  4330. if dst=src2 then
  4331. begin
  4332. if dst<>src1 then
  4333. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  4334. else
  4335. begin
  4336. tmpreg:=getintregister(list,size);
  4337. a_load_reg_reg(list,size,size,src2,dst);
  4338. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  4339. end;
  4340. end
  4341. else
  4342. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  4343. end;
  4344. end;
  4345. else
  4346. begin
  4347. if cgsetflags or setflags then
  4348. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4349. {$ifdef dummy}
  4350. { R13 is not allowed for certain instruction operands }
  4351. if op_reg_reg_opcg2asmopThumb2[op] in [A_ADD,A_SUB,A_AND,A_BIC,A_EOR] then
  4352. begin
  4353. if getsupreg(dst)=RS_R13 then
  4354. begin
  4355. tmpreg:=getintregister(list,OS_INT);
  4356. a_load_reg_reg(list,OS_INT,OS_INT,dst,tmpreg);
  4357. dst:=tmpreg;
  4358. end;
  4359. if getsupreg(src1)=RS_R13 then
  4360. begin
  4361. tmpreg:=getintregister(list,OS_INT);
  4362. a_load_reg_reg(list,OS_INT,OS_INT,src1,tmpreg);
  4363. src1:=tmpreg;
  4364. end;
  4365. end;
  4366. {$endif}
  4367. list.concat(setoppostfix(
  4368. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmopThumb2[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4369. end;
  4370. end;
  4371. maybeadjustresult(list,op,size,dst);
  4372. end;
  4373. procedure tthumb2cgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  4374. begin
  4375. list.concat(taicpu.op_cond(A_ITE, flags_to_cond(f)));
  4376. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  4377. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  4378. end;
  4379. procedure tthumb2cgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  4380. var
  4381. ref : treference;
  4382. shift : byte;
  4383. firstfloatreg,lastfloatreg,
  4384. r : byte;
  4385. regs : tcpuregisterset;
  4386. stackmisalignment: pint;
  4387. begin
  4388. LocalSize:=align(LocalSize,4);
  4389. { call instruction does not put anything on the stack }
  4390. stackmisalignment:=0;
  4391. if not(nostackframe) then
  4392. begin
  4393. firstfloatreg:=RS_NO;
  4394. lastfloatreg:=RS_NO;
  4395. { save floating point registers? }
  4396. for r:=RS_F0 to RS_F7 do
  4397. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4398. begin
  4399. if firstfloatreg=RS_NO then
  4400. firstfloatreg:=r;
  4401. lastfloatreg:=r;
  4402. inc(stackmisalignment,12);
  4403. end;
  4404. a_reg_alloc(list,NR_STACK_POINTER_REG);
  4405. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4406. begin
  4407. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  4408. a_reg_alloc(list,NR_R12);
  4409. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  4410. end;
  4411. { save int registers }
  4412. reference_reset(ref,4,[]);
  4413. ref.index:=NR_STACK_POINTER_REG;
  4414. ref.addressmode:=AM_PREINDEXED;
  4415. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4416. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4417. regs:=regs+[RS_FRAME_POINTER_REG,RS_R14]
  4418. else if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  4419. include(regs,RS_R14);
  4420. if regs<>[] then
  4421. begin
  4422. for r:=RS_R0 to RS_R15 do
  4423. if (r in regs) then
  4424. inc(stackmisalignment,4);
  4425. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4426. end;
  4427. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4428. begin
  4429. { the framepointer now points to the saved R15, so the saved
  4430. framepointer is at R11-12 (for get_caller_frame) }
  4431. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  4432. a_reg_dealloc(list,NR_R12);
  4433. end;
  4434. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4435. if (LocalSize<>0) or
  4436. ((stackmisalignment<>0) and
  4437. ((pi_do_call in current_procinfo.flags) or
  4438. (po_assembler in current_procinfo.procdef.procoptions))) then
  4439. begin
  4440. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4441. if not(is_shifter_const(localsize,shift)) then
  4442. begin
  4443. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  4444. a_reg_alloc(list,NR_R12);
  4445. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4446. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  4447. a_reg_dealloc(list,NR_R12);
  4448. end
  4449. else
  4450. begin
  4451. a_reg_dealloc(list,NR_R12);
  4452. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  4453. end;
  4454. end;
  4455. if firstfloatreg<>RS_NO then
  4456. begin
  4457. reference_reset(ref,4,[]);
  4458. if tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023 then
  4459. begin
  4460. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  4461. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4462. ref.base:=NR_R12;
  4463. end
  4464. else
  4465. begin
  4466. ref.base:=current_procinfo.framepointer;
  4467. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  4468. end;
  4469. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4470. lastfloatreg-firstfloatreg+1,ref));
  4471. end;
  4472. end;
  4473. end;
  4474. procedure tthumb2cgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  4475. var
  4476. ref : treference;
  4477. firstfloatreg,lastfloatreg,
  4478. r : byte;
  4479. shift : byte;
  4480. regs : tcpuregisterset;
  4481. LocalSize : longint;
  4482. stackmisalignment: pint;
  4483. begin
  4484. if not(nostackframe) then
  4485. begin
  4486. stackmisalignment:=0;
  4487. { restore floating point register }
  4488. firstfloatreg:=RS_NO;
  4489. lastfloatreg:=RS_NO;
  4490. { save floating point registers? }
  4491. for r:=RS_F0 to RS_F7 do
  4492. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4493. begin
  4494. if firstfloatreg=RS_NO then
  4495. firstfloatreg:=r;
  4496. lastfloatreg:=r;
  4497. { floating point register space is already included in
  4498. localsize below by calc_stackframe_size
  4499. inc(stackmisalignment,12);
  4500. }
  4501. end;
  4502. if firstfloatreg<>RS_NO then
  4503. begin
  4504. reference_reset(ref,4,[]);
  4505. if tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023 then
  4506. begin
  4507. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  4508. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4509. ref.base:=NR_R12;
  4510. end
  4511. else
  4512. begin
  4513. ref.base:=current_procinfo.framepointer;
  4514. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  4515. end;
  4516. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4517. lastfloatreg-firstfloatreg+1,ref));
  4518. end;
  4519. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4520. if (pi_do_call in current_procinfo.flags) or (regs<>[]) then
  4521. begin
  4522. exclude(regs,RS_R14);
  4523. include(regs,RS_R15);
  4524. end;
  4525. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  4526. regs:=regs+[RS_FRAME_POINTER_REG,RS_R15];
  4527. for r:=RS_R0 to RS_R15 do
  4528. if (r in regs) then
  4529. inc(stackmisalignment,4);
  4530. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4531. LocalSize:=current_procinfo.calc_stackframe_size;
  4532. if (LocalSize<>0) or
  4533. ((stackmisalignment<>0) and
  4534. ((pi_do_call in current_procinfo.flags) or
  4535. (po_assembler in current_procinfo.procdef.procoptions))) then
  4536. begin
  4537. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4538. if not(is_shifter_const(LocalSize,shift)) then
  4539. begin
  4540. a_reg_alloc(list,NR_R12);
  4541. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4542. list.concat(taicpu.op_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_R12));
  4543. a_reg_dealloc(list,NR_R12);
  4544. end
  4545. else
  4546. begin
  4547. a_reg_dealloc(list,NR_R12);
  4548. list.concat(taicpu.op_reg_const(A_ADD,NR_STACK_POINTER_REG,LocalSize));
  4549. end;
  4550. end;
  4551. if regs=[] then
  4552. list.concat(taicpu.op_reg_reg(A_MOV,NR_R15,NR_R14))
  4553. else
  4554. begin
  4555. reference_reset(ref,4,[]);
  4556. ref.index:=NR_STACK_POINTER_REG;
  4557. ref.addressmode:=AM_PREINDEXED;
  4558. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4559. end;
  4560. end
  4561. else
  4562. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14));
  4563. end;
  4564. function tthumb2cgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  4565. var
  4566. tmpreg : tregister;
  4567. tmpref : treference;
  4568. l : tasmlabel;
  4569. begin
  4570. tmpreg:=NR_NO;
  4571. { Be sure to have a base register }
  4572. if (ref.base=NR_NO) then
  4573. begin
  4574. if ref.shiftmode<>SM_None then
  4575. internalerror(2014020706);
  4576. ref.base:=ref.index;
  4577. ref.index:=NR_NO;
  4578. end;
  4579. { absolute symbols can't be handled directly, we've to store the symbol reference
  4580. in the text segment and access it pc relative
  4581. For now, we assume that references where base or index equals to PC are already
  4582. relative, all other references are assumed to be absolute and thus they need
  4583. to be handled extra.
  4584. A proper solution would be to change refoptions to a set and store the information
  4585. if the symbol is absolute or relative there.
  4586. }
  4587. if (assigned(ref.symbol) and
  4588. not(is_pc(ref.base)) and
  4589. not(is_pc(ref.index))
  4590. ) or
  4591. { [#xxx] isn't a valid address operand }
  4592. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  4593. //(ref.offset<-4095) or
  4594. (ref.offset<-255) or
  4595. (ref.offset>4095) or
  4596. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  4597. ((ref.offset<-255) or
  4598. (ref.offset>255)
  4599. )
  4600. ) or
  4601. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  4602. ((ref.offset<-1020) or
  4603. (ref.offset>1020) or
  4604. ((abs(ref.offset) mod 4)<>0) or
  4605. { the usual pc relative symbol handling assumes possible offsets of +/- 4095 }
  4606. assigned(ref.symbol)
  4607. )
  4608. ) then
  4609. begin
  4610. reference_reset(tmpref,4,[]);
  4611. { load symbol }
  4612. tmpreg:=getintregister(list,OS_INT);
  4613. if assigned(ref.symbol) then
  4614. begin
  4615. current_asmdata.getjumplabel(l);
  4616. cg.a_label(current_procinfo.aktlocaldata,l);
  4617. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  4618. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset));
  4619. { load consts entry }
  4620. tmpref.symbol:=l;
  4621. tmpref.base:=NR_R15;
  4622. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  4623. { in case of LDF/STF, we got rid of the NR_R15 }
  4624. if is_pc(ref.base) then
  4625. ref.base:=NR_NO;
  4626. if is_pc(ref.index) then
  4627. ref.index:=NR_NO;
  4628. end
  4629. else
  4630. a_load_const_reg(list,OS_ADDR,ref.offset,tmpreg);
  4631. if (ref.base<>NR_NO) then
  4632. begin
  4633. if ref.index<>NR_NO then
  4634. begin
  4635. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4636. ref.base:=tmpreg;
  4637. end
  4638. else
  4639. begin
  4640. ref.index:=tmpreg;
  4641. ref.shiftimm:=0;
  4642. ref.signindex:=1;
  4643. ref.shiftmode:=SM_None;
  4644. end;
  4645. end
  4646. else
  4647. ref.base:=tmpreg;
  4648. ref.offset:=0;
  4649. ref.symbol:=nil;
  4650. end;
  4651. if (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  4652. begin
  4653. if tmpreg<>NR_NO then
  4654. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg,tmpreg)
  4655. else
  4656. begin
  4657. tmpreg:=getintregister(list,OS_ADDR);
  4658. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg);
  4659. ref.base:=tmpreg;
  4660. end;
  4661. ref.offset:=0;
  4662. end;
  4663. { Hack? Thumb2 doesn't allow PC indexed addressing modes(although it does in the specification) }
  4664. if (ref.base=NR_R15) and (ref.index<>NR_NO) and (ref.shiftmode <> sm_none) then
  4665. begin
  4666. tmpreg:=getintregister(list,OS_ADDR);
  4667. list.concat(taicpu.op_reg_reg(A_MOV, tmpreg, NR_R15));
  4668. ref.base := tmpreg;
  4669. end;
  4670. { floating point operations have only limited references
  4671. we expect here, that a base is already set }
  4672. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  4673. begin
  4674. if ref.shiftmode<>SM_none then
  4675. internalerror(200309121);
  4676. if tmpreg<>NR_NO then
  4677. begin
  4678. if ref.base=tmpreg then
  4679. begin
  4680. if ref.signindex<0 then
  4681. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,tmpreg,ref.index))
  4682. else
  4683. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,tmpreg,ref.index));
  4684. ref.index:=NR_NO;
  4685. end
  4686. else
  4687. begin
  4688. if ref.index<>tmpreg then
  4689. internalerror(200403161);
  4690. if ref.signindex<0 then
  4691. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,ref.base,tmpreg))
  4692. else
  4693. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4694. ref.base:=tmpreg;
  4695. ref.index:=NR_NO;
  4696. end;
  4697. end
  4698. else
  4699. begin
  4700. tmpreg:=getintregister(list,OS_ADDR);
  4701. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,ref.index));
  4702. ref.base:=tmpreg;
  4703. ref.index:=NR_NO;
  4704. end;
  4705. end;
  4706. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  4707. Result := ref;
  4708. end;
  4709. procedure tthumb2cgarm.a_loadmm_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister; shuffle: pmmshuffle);
  4710. var
  4711. instr: taicpu;
  4712. begin
  4713. if (fromsize=OS_F32) and
  4714. (tosize=OS_F32) then
  4715. begin
  4716. instr:=setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32);
  4717. list.Concat(instr);
  4718. add_move_instruction(instr);
  4719. end
  4720. else if (fromsize=OS_F64) and
  4721. (tosize=OS_F64) then
  4722. begin
  4723. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,tregister(longint(reg2)+1),tregister(longint(reg1)+1)), PF_F32));
  4724. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32));
  4725. end
  4726. else if (fromsize=OS_F32) and
  4727. (tosize=OS_F64) then
  4728. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VCVT,reg2,reg1), PF_F32))
  4729. begin
  4730. //list.concat(nil);
  4731. end;
  4732. end;
  4733. procedure tthumb2cgarm.a_loadmm_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  4734. begin
  4735. handle_load_store(list,A_VLDR,PF_None,reg,ref);
  4736. end;
  4737. procedure tthumb2cgarm.a_loadmm_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  4738. begin
  4739. handle_load_store(list,A_VSTR,PF_None,reg,ref);
  4740. end;
  4741. procedure tthumb2cgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize: tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  4742. begin
  4743. if //(shuffle=nil) and
  4744. (tosize=OS_F32) then
  4745. list.Concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg))
  4746. else
  4747. internalerror(2012100813);
  4748. end;
  4749. procedure tthumb2cgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize: tcgsize; mmreg, intreg: tregister; shuffle: pmmshuffle);
  4750. begin
  4751. if //(shuffle=nil) and
  4752. (fromsize=OS_F32) then
  4753. list.Concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg))
  4754. else
  4755. internalerror(2012100814);
  4756. end;
  4757. procedure tthumb2cg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  4758. var tmpreg: tregister;
  4759. begin
  4760. case op of
  4761. OP_NEG:
  4762. begin
  4763. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4764. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  4765. tmpreg:=cg.getintregister(list,OS_32);
  4766. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,0));
  4767. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,tmpreg,regsrc.reghi));
  4768. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4769. end;
  4770. else
  4771. inherited a_op64_reg_reg(list, op, size, regsrc, regdst);
  4772. end;
  4773. end;
  4774. procedure tthumbcg64farm.a_op64_reg_reg(list: TAsmList; op: TOpCG; size: tcgsize; regsrc, regdst: tregister64);
  4775. begin
  4776. case op of
  4777. OP_NEG:
  4778. begin
  4779. list.concat(taicpu.op_reg_const(A_MOV,regdst.reglo,0));
  4780. list.concat(taicpu.op_reg_const(A_MOV,regdst.reghi,0));
  4781. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4782. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4783. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4784. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4785. end;
  4786. OP_NOT:
  4787. begin
  4788. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  4789. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  4790. end;
  4791. OP_AND,OP_OR,OP_XOR:
  4792. begin
  4793. cg.a_op_reg_reg(list,op,OS_32,regsrc.reglo,regdst.reglo);
  4794. cg.a_op_reg_reg(list,op,OS_32,regsrc.reghi,regdst.reghi);
  4795. end;
  4796. OP_ADD:
  4797. begin
  4798. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4799. list.concat(taicpu.op_reg_reg(A_ADD,regdst.reglo,regsrc.reglo));
  4800. list.concat(taicpu.op_reg_reg(A_ADC,regdst.reghi,regsrc.reghi));
  4801. end;
  4802. OP_SUB:
  4803. begin
  4804. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4805. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4806. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4807. end;
  4808. else
  4809. internalerror(2003083101);
  4810. end;
  4811. end;
  4812. procedure tthumbcg64farm.a_op64_const_reg(list: TAsmList; op: TOpCG; size: tcgsize; value: int64; reg: tregister64);
  4813. var
  4814. tmpreg : tregister;
  4815. begin
  4816. case op of
  4817. OP_AND,OP_OR,OP_XOR:
  4818. begin
  4819. cg.a_op_const_reg(list,op,OS_32,aint(lo(value)),reg.reglo);
  4820. cg.a_op_const_reg(list,op,OS_32,aint(hi(value)),reg.reghi);
  4821. end;
  4822. OP_ADD:
  4823. begin
  4824. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4825. begin
  4826. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4827. list.concat(taicpu.op_reg_const(A_ADD,reg.reglo,aint(lo(value))));
  4828. end
  4829. else
  4830. begin
  4831. tmpreg:=cg.getintregister(list,OS_32);
  4832. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4833. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4834. list.concat(taicpu.op_reg_reg(A_ADD,reg.reglo,tmpreg));
  4835. end;
  4836. tmpreg:=cg.getintregister(list,OS_32);
  4837. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  4838. list.concat(taicpu.op_reg_reg(A_ADC,reg.reghi,tmpreg));
  4839. end;
  4840. OP_SUB:
  4841. begin
  4842. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4843. begin
  4844. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4845. list.concat(taicpu.op_reg_const(A_SUB,reg.reglo,aint(lo(value))))
  4846. end
  4847. else
  4848. begin
  4849. tmpreg:=cg.getintregister(list,OS_32);
  4850. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4851. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4852. list.concat(taicpu.op_reg_reg(A_SUB,reg.reglo,tmpreg));
  4853. end;
  4854. tmpreg:=cg.getintregister(list,OS_32);
  4855. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  4856. list.concat(taicpu.op_reg_reg(A_SBC,reg.reghi,tmpreg));
  4857. end;
  4858. else
  4859. internalerror(2003083101);
  4860. end;
  4861. end;
  4862. procedure create_codegen;
  4863. begin
  4864. if GenerateThumb2Code then
  4865. begin
  4866. cg:=tthumb2cgarm.create;
  4867. cg64:=tthumb2cg64farm.create;
  4868. casmoptimizer:=TCpuThumb2AsmOptimizer;
  4869. end
  4870. else if GenerateThumbCode then
  4871. begin
  4872. cg:=tthumbcgarm.create;
  4873. cg64:=tthumbcg64farm.create;
  4874. // casmoptimizer:=TCpuThumbAsmOptimizer;
  4875. end
  4876. else
  4877. begin
  4878. cg:=tarmcgarm.create;
  4879. cg64:=tarmcg64farm.create;
  4880. casmoptimizer:=TCpuAsmOptimizer;
  4881. end;
  4882. end;
  4883. end.