cgcpu.pas 200 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762277227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382238323842385238623872388238923902391239223932394239523962397239823992400240124022403240424052406240724082409241024112412241324142415241624172418241924202421242224232424242524262427242824292430243124322433243424352436243724382439244024412442244324442445244624472448244924502451245224532454245524562457245824592460246124622463246424652466246724682469247024712472247324742475247624772478247924802481248224832484248524862487248824892490249124922493249424952496249724982499250025012502250325042505250625072508250925102511251225132514251525162517251825192520252125222523252425252526252725282529253025312532253325342535253625372538253925402541254225432544254525462547254825492550255125522553255425552556255725582559256025612562256325642565256625672568256925702571257225732574257525762577257825792580258125822583258425852586258725882589259025912592259325942595259625972598259926002601260226032604260526062607260826092610261126122613261426152616261726182619262026212622262326242625262626272628262926302631263226332634263526362637263826392640264126422643264426452646264726482649265026512652265326542655265626572658265926602661266226632664266526662667266826692670267126722673267426752676267726782679268026812682268326842685268626872688268926902691269226932694269526962697269826992700270127022703270427052706270727082709271027112712271327142715271627172718271927202721272227232724272527262727272827292730273127322733273427352736273727382739274027412742274327442745274627472748274927502751275227532754275527562757275827592760276127622763276427652766276727682769277027712772277327742775277627772778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327732783279328032813282328332843285328632873288328932903291329232933294329532963297329832993300330133023303330433053306330733083309331033113312331333143315331633173318331933203321332233233324332533263327332833293330333133323333333433353336333733383339334033413342334333443345334633473348334933503351335233533354335533563357335833593360336133623363336433653366336733683369337033713372337333743375337633773378337933803381338233833384338533863387338833893390339133923393339433953396339733983399340034013402340334043405340634073408340934103411341234133414341534163417341834193420342134223423342434253426342734283429343034313432343334343435343634373438343934403441344234433444344534463447344834493450345134523453345434553456345734583459346034613462346334643465346634673468346934703471347234733474347534763477347834793480348134823483348434853486348734883489349034913492349334943495349634973498349935003501350235033504350535063507350835093510351135123513351435153516351735183519352035213522352335243525352635273528352935303531353235333534353535363537353835393540354135423543354435453546354735483549355035513552355335543555355635573558355935603561356235633564356535663567356835693570357135723573357435753576357735783579358035813582358335843585358635873588358935903591359235933594359535963597359835993600360136023603360436053606360736083609361036113612361336143615361636173618361936203621362236233624362536263627362836293630363136323633363436353636363736383639364036413642364336443645364636473648364936503651365236533654365536563657365836593660366136623663366436653666366736683669367036713672367336743675367636773678367936803681368236833684368536863687368836893690369136923693369436953696369736983699370037013702370337043705370637073708370937103711371237133714371537163717371837193720372137223723372437253726372737283729373037313732373337343735373637373738373937403741374237433744374537463747374837493750375137523753375437553756375737583759376037613762376337643765376637673768376937703771377237733774377537763777377837793780378137823783378437853786378737883789379037913792379337943795379637973798379938003801380238033804380538063807380838093810381138123813381438153816381738183819382038213822382338243825382638273828382938303831383238333834383538363837383838393840384138423843384438453846384738483849385038513852385338543855385638573858385938603861386238633864386538663867386838693870387138723873387438753876387738783879388038813882388338843885388638873888388938903891389238933894389538963897389838993900390139023903390439053906390739083909391039113912391339143915391639173918391939203921392239233924392539263927392839293930393139323933393439353936393739383939394039413942394339443945394639473948394939503951395239533954395539563957395839593960396139623963396439653966396739683969397039713972397339743975397639773978397939803981398239833984398539863987398839893990399139923993399439953996399739983999400040014002400340044005400640074008400940104011401240134014401540164017401840194020402140224023402440254026402740284029403040314032403340344035403640374038403940404041404240434044404540464047404840494050405140524053405440554056405740584059406040614062406340644065406640674068406940704071407240734074407540764077407840794080408140824083408440854086408740884089409040914092409340944095409640974098409941004101410241034104410541064107410841094110411141124113411441154116411741184119412041214122412341244125412641274128412941304131413241334134413541364137413841394140414141424143414441454146414741484149415041514152415341544155415641574158415941604161416241634164416541664167416841694170417141724173417441754176417741784179418041814182418341844185418641874188418941904191419241934194419541964197419841994200420142024203420442054206420742084209421042114212421342144215421642174218421942204221422242234224422542264227422842294230423142324233423442354236423742384239424042414242424342444245424642474248424942504251425242534254425542564257425842594260426142624263426442654266426742684269427042714272427342744275427642774278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477747784779478047814782478347844785478647874788478947904791479247934794479547964797479847994800480148024803480448054806480748084809481048114812481348144815481648174818481948204821482248234824482548264827482848294830483148324833483448354836483748384839484048414842484348444845484648474848484948504851485248534854485548564857485848594860486148624863486448654866486748684869487048714872487348744875487648774878487948804881488248834884488548864887488848894890489148924893489448954896489748984899490049014902490349044905490649074908490949104911491249134914491549164917491849194920492149224923492449254926492749284929493049314932493349344935493649374938493949404941494249434944494549464947494849494950495149524953495449554956495749584959496049614962496349644965496649674968496949704971497249734974497549764977497849794980498149824983498449854986498749884989499049914992499349944995499649974998499950005001500250035004500550065007500850095010
  1. {
  2. Copyright (c) 2003 by Florian Klaempfl
  3. Member of the Free Pascal development team
  4. This unit implements the code generator for the ARM
  5. This program is free software; you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation; either version 2 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program; if not, write to the Free Software
  15. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  16. ****************************************************************************
  17. }
  18. unit cgcpu;
  19. {$i fpcdefs.inc}
  20. interface
  21. uses
  22. globtype,symtype,symdef,
  23. cgbase,cgutils,cgobj,
  24. aasmbase,aasmcpu,aasmtai,aasmdata,
  25. parabase,
  26. cpubase,cpuinfo,cg64f32,rgcpu;
  27. type
  28. { tbasecgarm is shared between all arm architectures }
  29. tbasecgarm = class(tcg)
  30. { true, if the next arithmetic operation should modify the flags }
  31. cgsetflags : boolean;
  32. procedure a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);override;
  33. procedure a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);override;
  34. procedure a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);override;
  35. procedure a_call_name(list : TAsmList;const s : string; weak: boolean);override;
  36. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  37. procedure a_call_ref(list : TAsmList;ref: treference);override;
  38. { move instructions }
  39. procedure a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);override;
  40. procedure a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);override;
  41. function a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  42. function a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  43. { fpu move instructions }
  44. procedure a_loadfpu_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister); override;
  45. procedure a_loadfpu_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister); override;
  46. procedure a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference); override;
  47. procedure a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);override;
  48. { comparison operations }
  49. procedure a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  50. l : tasmlabel);override;
  51. procedure a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel); override;
  52. procedure a_jmp_name(list : TAsmList;const s : string); override;
  53. procedure a_jmp_always(list : TAsmList;l: tasmlabel); override;
  54. procedure a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel); override;
  55. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  56. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  57. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  58. procedure a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);override;
  59. procedure g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);override;
  60. procedure g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);override;
  61. procedure g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  62. procedure g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  63. procedure g_overflowcheck(list: TAsmList; const l: tlocation; def: tdef); override;
  64. procedure g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);override;
  65. procedure g_save_registers(list : TAsmList);override;
  66. procedure g_restore_registers(list : TAsmList);override;
  67. procedure a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  68. procedure fixref(list : TAsmList;var ref : treference);
  69. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; virtual;
  70. procedure g_intf_wrapper(list: TAsmList; procdef: tprocdef; const labelname: string; ioffset: longint);override;
  71. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  72. procedure g_stackpointer_alloc(list : TAsmList;size : longint);override;
  73. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  74. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  75. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  76. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  77. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  78. procedure a_opmm_reg_reg(list: TAsmList; Op: TOpCG; size : tcgsize;src,dst: tregister;shuffle : pmmshuffle); override;
  79. { Transform unsupported methods into Internal errors }
  80. procedure a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; size: TCGSize; src, dst: TRegister); override;
  81. { try to generate optimized 32 Bit multiplication, returns true if successful generated }
  82. function try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  83. { clear out potential overflow bits from 8 or 16 bit operations }
  84. { the upper 24/16 bits of a register after an operation }
  85. procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  86. function get_darwin_call_stub(const s: string; weak: boolean): tasmsymbol;
  87. end;
  88. { tcgarm is shared between normal arm and thumb-2 }
  89. tcgarm = class(tbasecgarm)
  90. procedure a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister); override;
  91. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  92. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  93. size: tcgsize; a: tcgint; src, dst: tregister); override;
  94. procedure a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  95. size: tcgsize; src1, src2, dst: tregister); override;
  96. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  97. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  98. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  99. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  100. end;
  101. { normal arm cg }
  102. tarmcgarm = class(tcgarm)
  103. procedure init_register_allocators;override;
  104. procedure done_register_allocators;override;
  105. end;
  106. { 64 bit cg for all arm flavours }
  107. tbasecg64farm = class(tcg64f32)
  108. end;
  109. { tcg64farm is shared between normal arm and thumb-2 }
  110. tcg64farm = class(tbasecg64farm)
  111. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  112. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  113. procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;
  114. procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
  115. procedure a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  116. procedure a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  117. procedure a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);override;
  118. procedure a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);override;
  119. end;
  120. tarmcg64farm = class(tcg64farm)
  121. end;
  122. tthumbcgarm = class(tbasecgarm)
  123. procedure init_register_allocators;override;
  124. procedure done_register_allocators;override;
  125. procedure g_proc_entry(list: TAsmList; localsize: longint; nostackframe: boolean);override;
  126. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  127. procedure a_op_reg_reg(list: TAsmList; Op: TOpCG; size: TCGSize; src,dst: TRegister);override;
  128. procedure a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);override;
  129. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  130. procedure a_load_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const Ref: treference; reg: tregister);override;
  131. procedure a_load_const_reg(list: TAsmList; size: tcgsize; a: tcgint; reg: tregister);override;
  132. end;
  133. tthumbcg64farm = class(tbasecg64farm)
  134. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  135. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  136. end;
  137. tthumb2cgarm = class(tcgarm)
  138. procedure init_register_allocators;override;
  139. procedure done_register_allocators;override;
  140. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  141. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  142. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  143. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  144. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  145. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  146. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  147. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  148. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  149. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; override;
  150. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  151. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  152. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  153. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  154. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  155. end;
  156. tthumb2cg64farm = class(tcg64farm)
  157. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  158. end;
  159. const
  160. OpCmp2AsmCond : Array[topcmp] of TAsmCond = (C_NONE,C_EQ,C_GT,
  161. C_LT,C_GE,C_LE,C_NE,C_LS,C_CC,C_CS,C_HI);
  162. winstackpagesize = 4096;
  163. function get_fpu_postfix(def : tdef) : toppostfix;
  164. procedure create_codegen;
  165. implementation
  166. uses
  167. globals,verbose,systems,cutils,
  168. aopt,aoptcpu,
  169. fmodule,
  170. symconst,symsym,symtable,
  171. tgobj,
  172. procinfo,cpupi,
  173. paramgr;
  174. function get_fpu_postfix(def : tdef) : toppostfix;
  175. begin
  176. if def.typ=floatdef then
  177. begin
  178. case tfloatdef(def).floattype of
  179. s32real:
  180. result:=PF_S;
  181. s64real:
  182. result:=PF_D;
  183. s80real:
  184. result:=PF_E;
  185. else
  186. internalerror(200401272);
  187. end;
  188. end
  189. else
  190. internalerror(200401271);
  191. end;
  192. procedure tarmcgarm.init_register_allocators;
  193. begin
  194. inherited init_register_allocators;
  195. { currently, we always save R14, so we can use it }
  196. if (target_info.system<>system_arm_darwin) then
  197. begin
  198. if assigned(current_procinfo) and (current_procinfo.framepointer<>NR_R11) then
  199. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  200. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  201. RS_R9,RS_R10,RS_R11,RS_R14],first_int_imreg,[])
  202. else
  203. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  204. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  205. RS_R9,RS_R10,RS_R14],first_int_imreg,[])
  206. end
  207. else
  208. { r7 is not available on Darwin, it's used as frame pointer (always,
  209. for backtrace support -- also in gcc/clang -> R11 can be used).
  210. r9 is volatile }
  211. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  212. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R9,RS_R12,RS_R4,RS_R5,RS_R6,RS_R8,
  213. RS_R10,RS_R11,RS_R14],first_int_imreg,[]);
  214. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  215. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  216. { The register allocator currently cannot deal with multiple
  217. non-overlapping subregs per register, so we can only use
  218. half the single precision registers for now (as sub registers of the
  219. double precision ones). }
  220. if current_settings.fputype=fpu_vfpv3 then
  221. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  222. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  223. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  224. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  225. ],first_mm_imreg,[])
  226. else
  227. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  228. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15],first_mm_imreg,[]);
  229. end;
  230. procedure tarmcgarm.done_register_allocators;
  231. begin
  232. rg[R_INTREGISTER].free;
  233. rg[R_FPUREGISTER].free;
  234. rg[R_MMREGISTER].free;
  235. inherited done_register_allocators;
  236. end;
  237. procedure tcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  238. var
  239. imm_shift : byte;
  240. l : tasmlabel;
  241. hr : treference;
  242. imm1, imm2: DWord;
  243. begin
  244. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  245. internalerror(2002090902);
  246. if is_shifter_const(a,imm_shift) then
  247. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  248. else if is_shifter_const(not(a),imm_shift) then
  249. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  250. { loading of constants with mov and orr }
  251. else if (split_into_shifter_const(a,imm1, imm2)) then
  252. begin
  253. list.concat(taicpu.op_reg_const(A_MOV,reg, imm1));
  254. list.concat(taicpu.op_reg_reg_const(A_ORR,reg,reg, imm2));
  255. end
  256. { loading of constants with mvn and bic }
  257. else if (split_into_shifter_const(not(a), imm1, imm2)) then
  258. begin
  259. list.concat(taicpu.op_reg_const(A_MVN,reg, imm1));
  260. list.concat(taicpu.op_reg_reg_const(A_BIC,reg,reg, imm2));
  261. end
  262. else
  263. begin
  264. reference_reset(hr,4);
  265. current_asmdata.getjumplabel(l);
  266. cg.a_label(current_procinfo.aktlocaldata,l);
  267. hr.symboldata:=current_procinfo.aktlocaldata.last;
  268. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  269. hr.symbol:=l;
  270. hr.base:=NR_PC;
  271. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  272. end;
  273. end;
  274. procedure tcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  275. var
  276. oppostfix:toppostfix;
  277. usedtmpref: treference;
  278. tmpreg,tmpreg2 : tregister;
  279. so : tshifterop;
  280. dir : integer;
  281. begin
  282. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  283. FromSize := ToSize;
  284. case FromSize of
  285. { signed integer registers }
  286. OS_8:
  287. oppostfix:=PF_B;
  288. OS_S8:
  289. oppostfix:=PF_SB;
  290. OS_16:
  291. oppostfix:=PF_H;
  292. OS_S16:
  293. oppostfix:=PF_SH;
  294. OS_32,
  295. OS_S32:
  296. oppostfix:=PF_None;
  297. else
  298. InternalError(200308297);
  299. end;
  300. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  301. begin
  302. if target_info.endian=endian_big then
  303. dir:=-1
  304. else
  305. dir:=1;
  306. case FromSize of
  307. OS_16,OS_S16:
  308. begin
  309. { only complicated references need an extra loadaddr }
  310. if assigned(ref.symbol) or
  311. (ref.index<>NR_NO) or
  312. (ref.offset<-4095) or
  313. (ref.offset>4094) or
  314. { sometimes the compiler reused registers }
  315. (reg=ref.index) or
  316. (reg=ref.base) then
  317. begin
  318. tmpreg2:=getintregister(list,OS_INT);
  319. a_loadaddr_ref_reg(list,ref,tmpreg2);
  320. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  321. end
  322. else
  323. usedtmpref:=ref;
  324. if target_info.endian=endian_big then
  325. inc(usedtmpref.offset,1);
  326. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  327. tmpreg:=getintregister(list,OS_INT);
  328. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  329. inc(usedtmpref.offset,dir);
  330. if FromSize=OS_16 then
  331. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  332. else
  333. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  334. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  335. end;
  336. OS_32,OS_S32:
  337. begin
  338. tmpreg:=getintregister(list,OS_INT);
  339. { only complicated references need an extra loadaddr }
  340. if assigned(ref.symbol) or
  341. (ref.index<>NR_NO) or
  342. (ref.offset<-4095) or
  343. (ref.offset>4092) or
  344. { sometimes the compiler reused registers }
  345. (reg=ref.index) or
  346. (reg=ref.base) then
  347. begin
  348. tmpreg2:=getintregister(list,OS_INT);
  349. a_loadaddr_ref_reg(list,ref,tmpreg2);
  350. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  351. end
  352. else
  353. usedtmpref:=ref;
  354. shifterop_reset(so);so.shiftmode:=SM_LSL;
  355. if ref.alignment=2 then
  356. begin
  357. if target_info.endian=endian_big then
  358. inc(usedtmpref.offset,2);
  359. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  360. inc(usedtmpref.offset,dir*2);
  361. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  362. so.shiftimm:=16;
  363. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  364. end
  365. else
  366. begin
  367. tmpreg2:=getintregister(list,OS_INT);
  368. if target_info.endian=endian_big then
  369. inc(usedtmpref.offset,3);
  370. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  371. inc(usedtmpref.offset,dir);
  372. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  373. inc(usedtmpref.offset,dir);
  374. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg2);
  375. so.shiftimm:=8;
  376. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  377. inc(usedtmpref.offset,dir);
  378. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  379. so.shiftimm:=16;
  380. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg2,so));
  381. so.shiftimm:=24;
  382. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  383. end;
  384. end
  385. else
  386. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  387. end;
  388. end
  389. else
  390. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  391. if (fromsize=OS_S8) and (tosize = OS_16) then
  392. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  393. end;
  394. procedure tbasecgarm.a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);
  395. var
  396. ref: treference;
  397. begin
  398. paraloc.check_simple_location;
  399. paramanager.allocparaloc(list,paraloc.location);
  400. case paraloc.location^.loc of
  401. LOC_REGISTER,LOC_CREGISTER:
  402. a_load_const_reg(list,size,a,paraloc.location^.register);
  403. LOC_REFERENCE:
  404. begin
  405. reference_reset(ref,paraloc.alignment);
  406. ref.base:=paraloc.location^.reference.index;
  407. ref.offset:=paraloc.location^.reference.offset;
  408. a_load_const_ref(list,size,a,ref);
  409. end;
  410. else
  411. internalerror(2002081101);
  412. end;
  413. end;
  414. procedure tbasecgarm.a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);
  415. var
  416. tmpref, ref: treference;
  417. location: pcgparalocation;
  418. sizeleft: aint;
  419. begin
  420. location := paraloc.location;
  421. tmpref := r;
  422. sizeleft := paraloc.intsize;
  423. while assigned(location) do
  424. begin
  425. paramanager.allocparaloc(list,location);
  426. case location^.loc of
  427. LOC_REGISTER,LOC_CREGISTER:
  428. a_load_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  429. LOC_REFERENCE:
  430. begin
  431. reference_reset_base(ref,location^.reference.index,location^.reference.offset,paraloc.alignment);
  432. { doubles in softemu mode have a strange order of registers and references }
  433. if location^.size=OS_32 then
  434. g_concatcopy(list,tmpref,ref,4)
  435. else
  436. begin
  437. g_concatcopy(list,tmpref,ref,sizeleft);
  438. if assigned(location^.next) then
  439. internalerror(2005010710);
  440. end;
  441. end;
  442. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  443. case location^.size of
  444. OS_F32, OS_F64:
  445. a_loadfpu_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  446. else
  447. internalerror(2002072801);
  448. end;
  449. LOC_VOID:
  450. begin
  451. // nothing to do
  452. end;
  453. else
  454. internalerror(2002081103);
  455. end;
  456. inc(tmpref.offset,tcgsize2size[location^.size]);
  457. dec(sizeleft,tcgsize2size[location^.size]);
  458. location := location^.next;
  459. end;
  460. end;
  461. procedure tbasecgarm.a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);
  462. var
  463. ref: treference;
  464. tmpreg: tregister;
  465. begin
  466. paraloc.check_simple_location;
  467. paramanager.allocparaloc(list,paraloc.location);
  468. case paraloc.location^.loc of
  469. LOC_REGISTER,LOC_CREGISTER:
  470. a_loadaddr_ref_reg(list,r,paraloc.location^.register);
  471. LOC_REFERENCE:
  472. begin
  473. reference_reset(ref,paraloc.alignment);
  474. ref.base := paraloc.location^.reference.index;
  475. ref.offset := paraloc.location^.reference.offset;
  476. tmpreg := getintregister(list,OS_ADDR);
  477. a_loadaddr_ref_reg(list,r,tmpreg);
  478. a_load_reg_ref(list,OS_ADDR,OS_ADDR,tmpreg,ref);
  479. end;
  480. else
  481. internalerror(2002080701);
  482. end;
  483. end;
  484. procedure tbasecgarm.a_call_name(list : TAsmList;const s : string; weak: boolean);
  485. var
  486. branchopcode: tasmop;
  487. begin
  488. { check not really correct: should only be used for non-Thumb cpus }
  489. if CPUARM_HAS_BLX_LABEL in cpu_capabilities[current_settings.cputype] then
  490. branchopcode:=A_BLX
  491. else
  492. branchopcode:=A_BL;
  493. if target_info.system<>system_arm_darwin then
  494. if not weak then
  495. list.concat(taicpu.op_sym(branchopcode,current_asmdata.RefAsmSymbol(s)))
  496. else
  497. list.concat(taicpu.op_sym(branchopcode,current_asmdata.WeakRefAsmSymbol(s)))
  498. else
  499. list.concat(taicpu.op_sym(branchopcode,get_darwin_call_stub(s,weak)));
  500. {
  501. the compiler does not properly set this flag anymore in pass 1, and
  502. for now we only need it after pass 2 (I hope) (JM)
  503. if not(pi_do_call in current_procinfo.flags) then
  504. internalerror(2003060703);
  505. }
  506. include(current_procinfo.flags,pi_do_call);
  507. end;
  508. procedure tbasecgarm.a_call_reg(list : TAsmList;reg: tregister);
  509. begin
  510. { check not really correct: should only be used for non-Thumb cpus }
  511. if not(CPUARM_HAS_BLX in cpu_capabilities[current_settings.cputype]) then
  512. begin
  513. list.concat(taicpu.op_reg_reg(A_MOV,NR_R14,NR_PC));
  514. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,reg));
  515. end
  516. else
  517. list.concat(taicpu.op_reg(A_BLX, reg));
  518. {
  519. the compiler does not properly set this flag anymore in pass 1, and
  520. for now we only need it after pass 2 (I hope) (JM)
  521. if not(pi_do_call in current_procinfo.flags) then
  522. internalerror(2003060703);
  523. }
  524. include(current_procinfo.flags,pi_do_call);
  525. end;
  526. procedure tbasecgarm.a_call_ref(list : TAsmList;ref: treference);
  527. begin
  528. a_reg_alloc(list,NR_R12);
  529. a_load_ref_reg(list,OS_ADDR,OS_ADDR,ref,NR_R12);
  530. a_call_reg(list,NR_R12);
  531. a_reg_dealloc(list,NR_R12);
  532. include(current_procinfo.flags,pi_do_call);
  533. end;
  534. procedure tcgarm.a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister);
  535. begin
  536. a_op_const_reg_reg(list,op,size,a,reg,reg);
  537. end;
  538. procedure tcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  539. var
  540. so : tshifterop;
  541. begin
  542. if op = OP_NEG then
  543. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,src,0))
  544. else if op = OP_NOT then
  545. begin
  546. if size in [OS_8, OS_16, OS_S8, OS_S16] then
  547. begin
  548. shifterop_reset(so);
  549. so.shiftmode:=SM_LSL;
  550. if size in [OS_8, OS_S8] then
  551. so.shiftimm:=24
  552. else
  553. so.shiftimm:=16;
  554. list.concat(taicpu.op_reg_reg_shifterop(A_MVN,dst,src,so));
  555. {Using a shift here allows this to be folded into another instruction}
  556. if size in [OS_S8, OS_S16] then
  557. so.shiftmode:=SM_ASR
  558. else
  559. so.shiftmode:=SM_LSR;
  560. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  561. end
  562. else
  563. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  564. end
  565. else
  566. a_op_reg_reg_reg(list,op,OS_32,src,dst,dst);
  567. end;
  568. const
  569. op_reg_reg_opcg2asmop: array[TOpCG] of tasmop =
  570. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  571. A_NONE,A_NONE,A_NONE,A_SUB,A_EOR,A_NONE,A_NONE);
  572. op_reg_opcg2asmop: array[TOpCG] of tasmop =
  573. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  574. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  575. op_reg_postfix: array[TOpCG] of TOpPostfix =
  576. (PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,
  577. PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None);
  578. procedure tcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  579. size: tcgsize; a: tcgint; src, dst: tregister);
  580. var
  581. ovloc : tlocation;
  582. begin
  583. a_op_const_reg_reg_checkoverflow(list,op,size,a,src,dst,false,ovloc);
  584. end;
  585. procedure tcgarm.a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  586. size: tcgsize; src1, src2, dst: tregister);
  587. var
  588. ovloc : tlocation;
  589. begin
  590. a_op_reg_reg_reg_checkoverflow(list,op,size,src1,src2,dst,false,ovloc);
  591. end;
  592. function opshift2shiftmode(op: TOpCg): tshiftmode;
  593. begin
  594. case op of
  595. OP_SHL: Result:=SM_LSL;
  596. OP_SHR: Result:=SM_LSR;
  597. OP_ROR: Result:=SM_ROR;
  598. OP_ROL: Result:=SM_ROR;
  599. OP_SAR: Result:=SM_ASR;
  600. else internalerror(2012070501);
  601. end
  602. end;
  603. function tbasecgarm.try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  604. var
  605. multiplier : dword;
  606. power : longint;
  607. shifterop : tshifterop;
  608. bitsset : byte;
  609. negative : boolean;
  610. first : boolean;
  611. b,
  612. cycles : byte;
  613. maxeffort : byte;
  614. begin
  615. result:=true;
  616. cycles:=0;
  617. negative:=a<0;
  618. shifterop.rs:=NR_NO;
  619. shifterop.shiftmode:=SM_LSL;
  620. if negative then
  621. inc(cycles);
  622. multiplier:=dword(abs(a));
  623. bitsset:=popcnt(multiplier and $fffffffe);
  624. { heuristics to estimate how much instructions are reasonable to replace the mul,
  625. this is currently based on XScale timings }
  626. { in the simplest case, we need a mov to load the constant and a mul to carry out the
  627. actual multiplication, this requires min. 1+4 cycles
  628. because the first shift imm. might cause a stall and because we need more instructions
  629. when replacing the mul we generate max. 3 instructions to replace this mul }
  630. maxeffort:=3;
  631. { if the constant is not a shifter op, we need either some mov/mvn/bic/or sequence or
  632. a ldr, so generating one more operation to replace this is beneficial }
  633. if not(is_shifter_const(dword(a),b)) and not(is_shifter_const(not(dword(a)),b)) then
  634. inc(maxeffort);
  635. { if the upper 5 bits are all set or clear, mul is one cycle faster }
  636. if ((dword(a) and $f8000000)=0) or ((dword(a) and $f8000000)=$f8000000) then
  637. dec(maxeffort);
  638. { if the upper 17 bits are all set or clear, mul is another cycle faster }
  639. if ((dword(a) and $ffff8000)=0) or ((dword(a) and $ffff8000)=$ffff8000) then
  640. dec(maxeffort);
  641. { most simple cases }
  642. if a=1 then
  643. a_load_reg_reg(list,OS_32,OS_32,src,dst)
  644. else if a=0 then
  645. a_load_const_reg(list,OS_32,0,dst)
  646. else if a=-1 then
  647. a_op_reg_reg(list,OP_NEG,OS_32,src,dst)
  648. { add up ?
  649. basically, one add is needed for each bit being set in the constant factor
  650. however, the least significant bit is for free, it can be hidden in the initial
  651. instruction
  652. }
  653. else if (bitsset+cycles<=maxeffort) and
  654. (bitsset<=popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)) then
  655. begin
  656. first:=true;
  657. while multiplier<>0 do
  658. begin
  659. shifterop.shiftimm:=BsrDWord(multiplier);
  660. if odd(multiplier) then
  661. begin
  662. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,shifterop));
  663. dec(multiplier);
  664. end
  665. else
  666. if first then
  667. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  668. else
  669. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,src,shifterop));
  670. first:=false;
  671. dec(multiplier,1 shl shifterop.shiftimm);
  672. end;
  673. if negative then
  674. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  675. end
  676. { subtract from the next greater power of two? }
  677. else if popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)+cycles+1<=maxeffort then
  678. begin
  679. first:=true;
  680. while multiplier<>0 do
  681. begin
  682. if first then
  683. begin
  684. multiplier:=(1 shl power)-multiplier;
  685. shifterop.shiftimm:=power;
  686. end
  687. else
  688. shifterop.shiftimm:=BsrDWord(multiplier);
  689. if odd(multiplier) then
  690. begin
  691. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,shifterop));
  692. dec(multiplier);
  693. end
  694. else
  695. if first then
  696. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  697. else
  698. begin
  699. list.concat(taicpu.op_reg_reg_reg_shifterop(A_SUB,dst,dst,src,shifterop));
  700. dec(multiplier,1 shl shifterop.shiftimm);
  701. end;
  702. first:=false;
  703. end;
  704. if negative then
  705. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  706. end
  707. else
  708. result:=false;
  709. end;
  710. procedure tcgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  711. var
  712. shift : byte;
  713. tmpreg : tregister;
  714. so : tshifterop;
  715. l1 : longint;
  716. imm1, imm2: DWord;
  717. begin
  718. ovloc.loc:=LOC_VOID;
  719. if {$ifopt R+}(a<>-2147483648) and{$endif} not setflags and is_shifter_const(-a,shift) then
  720. case op of
  721. OP_ADD:
  722. begin
  723. op:=OP_SUB;
  724. a:=aint(dword(-a));
  725. end;
  726. OP_SUB:
  727. begin
  728. op:=OP_ADD;
  729. a:=aint(dword(-a));
  730. end
  731. end;
  732. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  733. case op of
  734. OP_NEG,OP_NOT:
  735. internalerror(200308281);
  736. OP_SHL,
  737. OP_SHR,
  738. OP_ROL,
  739. OP_ROR,
  740. OP_SAR:
  741. begin
  742. if a>32 then
  743. internalerror(200308294);
  744. if a<>0 then
  745. begin
  746. shifterop_reset(so);
  747. so.shiftmode:=opshift2shiftmode(op);
  748. if op = OP_ROL then
  749. so.shiftimm:=32-a
  750. else
  751. so.shiftimm:=a;
  752. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  753. end
  754. else
  755. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  756. end;
  757. else
  758. {if (op in [OP_SUB, OP_ADD]) and
  759. ((a < 0) or
  760. (a > 4095)) then
  761. begin
  762. tmpreg:=getintregister(list,size);
  763. list.concat(taicpu.op_reg_const(A_MOVT, tmpreg, (a shr 16) and $FFFF));
  764. list.concat(taicpu.op_reg_const(A_MOV, tmpreg, a and $FFFF));
  765. list.concat(setoppostfix(taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))
  766. ));
  767. end
  768. else}
  769. begin
  770. if cgsetflags or setflags then
  771. a_reg_alloc(list,NR_DEFAULTFLAGS);
  772. list.concat(setoppostfix(
  773. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  774. end;
  775. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  776. begin
  777. ovloc.loc:=LOC_FLAGS;
  778. case op of
  779. OP_ADD:
  780. ovloc.resflags:=F_CS;
  781. OP_SUB:
  782. ovloc.resflags:=F_CC;
  783. end;
  784. end;
  785. end
  786. else
  787. begin
  788. { there could be added some more sophisticated optimizations }
  789. if (op in [OP_MUL,OP_IMUL,OP_DIV,OP_IDIV]) and (a=1) then
  790. a_load_reg_reg(list,size,size,src,dst)
  791. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  792. a_load_const_reg(list,size,0,dst)
  793. else if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  794. a_op_reg_reg(list,OP_NEG,size,src,dst)
  795. { we do this here instead in the peephole optimizer because
  796. it saves us a register }
  797. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  798. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  799. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  800. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  801. begin
  802. if l1>32 then{roozbeh does this ever happen?}
  803. internalerror(200308296);
  804. shifterop_reset(so);
  805. so.shiftmode:=SM_LSL;
  806. so.shiftimm:=l1;
  807. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  808. end
  809. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  810. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  811. begin
  812. if l1>32 then{does this ever happen?}
  813. internalerror(201205181);
  814. shifterop_reset(so);
  815. so.shiftmode:=SM_LSL;
  816. so.shiftimm:=l1;
  817. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  818. end
  819. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  820. begin
  821. { nothing to do on success }
  822. end
  823. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  824. Just using mov x, #0 might allow some easier optimizations down the line. }
  825. else if (op = OP_AND) and (dword(a)=0) then
  826. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  827. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  828. else if (op = OP_AND) and (not(dword(a))=0) then
  829. list.concat(taicpu.op_reg_reg(A_MOV,dst,src))
  830. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  831. broader range of shifterconstants.}
  832. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  833. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  834. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  835. begin
  836. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,imm1));
  837. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  838. end
  839. else if (op in [OP_ADD, OP_SUB, OP_OR]) and
  840. not(cgsetflags or setflags) and
  841. split_into_shifter_const(a, imm1, imm2) then
  842. begin
  843. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,imm1));
  844. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  845. end
  846. else
  847. begin
  848. tmpreg:=getintregister(list,size);
  849. a_load_const_reg(list,size,a,tmpreg);
  850. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  851. end;
  852. end;
  853. maybeadjustresult(list,op,size,dst);
  854. end;
  855. procedure tcgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  856. var
  857. so : tshifterop;
  858. tmpreg,overflowreg : tregister;
  859. asmop : tasmop;
  860. begin
  861. ovloc.loc:=LOC_VOID;
  862. case op of
  863. OP_NEG,OP_NOT,
  864. OP_DIV,OP_IDIV:
  865. internalerror(200308281);
  866. OP_SHL,
  867. OP_SHR,
  868. OP_SAR,
  869. OP_ROR:
  870. begin
  871. if (op = OP_ROR) and not(size in [OS_32,OS_S32]) then
  872. internalerror(2008072801);
  873. shifterop_reset(so);
  874. so.rs:=src1;
  875. so.shiftmode:=opshift2shiftmode(op);
  876. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  877. end;
  878. OP_ROL:
  879. begin
  880. if not(size in [OS_32,OS_S32]) then
  881. internalerror(2008072801);
  882. { simulate ROL by ror'ing 32-value }
  883. tmpreg:=getintregister(list,OS_32);
  884. list.concat(taicpu.op_reg_reg_const(A_RSB,tmpreg,src1, 32));
  885. shifterop_reset(so);
  886. so.rs:=tmpreg;
  887. so.shiftmode:=SM_ROR;
  888. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  889. end;
  890. OP_IMUL,
  891. OP_MUL:
  892. begin
  893. if cgsetflags or setflags then
  894. begin
  895. overflowreg:=getintregister(list,size);
  896. if op=OP_IMUL then
  897. asmop:=A_SMULL
  898. else
  899. asmop:=A_UMULL;
  900. { the arm doesn't allow that rd and rm are the same }
  901. if dst=src2 then
  902. begin
  903. if dst<>src1 then
  904. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  905. else
  906. begin
  907. tmpreg:=getintregister(list,size);
  908. a_load_reg_reg(list,size,size,src2,dst);
  909. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  910. end;
  911. end
  912. else
  913. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  914. a_reg_alloc(list,NR_DEFAULTFLAGS);
  915. if op=OP_IMUL then
  916. begin
  917. shifterop_reset(so);
  918. so.shiftmode:=SM_ASR;
  919. so.shiftimm:=31;
  920. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  921. end
  922. else
  923. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  924. ovloc.loc:=LOC_FLAGS;
  925. ovloc.resflags:=F_NE;
  926. end
  927. else
  928. begin
  929. { the arm doesn't allow that rd and rm are the same }
  930. if dst=src2 then
  931. begin
  932. if dst<>src1 then
  933. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  934. else
  935. begin
  936. tmpreg:=getintregister(list,size);
  937. a_load_reg_reg(list,size,size,src2,dst);
  938. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  939. end;
  940. end
  941. else
  942. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  943. end;
  944. end;
  945. else
  946. begin
  947. if cgsetflags or setflags then
  948. a_reg_alloc(list,NR_DEFAULTFLAGS);
  949. list.concat(setoppostfix(
  950. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  951. end;
  952. end;
  953. maybeadjustresult(list,op,size,dst);
  954. end;
  955. function tbasecgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  956. var
  957. tmpreg : tregister;
  958. tmpref : treference;
  959. l : tasmlabel;
  960. begin
  961. tmpreg:=NR_NO;
  962. { Be sure to have a base register }
  963. if (ref.base=NR_NO) then
  964. begin
  965. if ref.shiftmode<>SM_None then
  966. internalerror(200308294);
  967. ref.base:=ref.index;
  968. ref.index:=NR_NO;
  969. end;
  970. { absolute symbols can't be handled directly, we've to store the symbol reference
  971. in the text segment and access it pc relative
  972. For now, we assume that references where base or index equals to PC are already
  973. relative, all other references are assumed to be absolute and thus they need
  974. to be handled extra.
  975. A proper solution would be to change refoptions to a set and store the information
  976. if the symbol is absolute or relative there.
  977. }
  978. if (assigned(ref.symbol) and
  979. not(is_pc(ref.base)) and
  980. not(is_pc(ref.index))
  981. ) or
  982. { [#xxx] isn't a valid address operand }
  983. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  984. (ref.offset<-4095) or
  985. (ref.offset>4095) or
  986. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  987. ((ref.offset<-255) or
  988. (ref.offset>255)
  989. )
  990. ) or
  991. ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) and
  992. ((ref.offset<-1020) or
  993. (ref.offset>1020) or
  994. ((abs(ref.offset) mod 4)<>0)
  995. )
  996. ) or
  997. ((current_settings.cputype in cpu_thumb) and
  998. (((oppostfix in [PF_SB,PF_SH]) and (ref.offset<>0)) or
  999. ((oppostfix=PF_None) and ((ref.offset<0) or (ref.offset>124) or ((ref.offset mod 4)<>0))) or
  1000. ((oppostfix=PF_H) and ((ref.offset<0) or (ref.offset>62) or ((ref.offset mod 2)<>0))) or
  1001. ((oppostfix=PF_B) and ((ref.offset<0) or (ref.offset>31)))
  1002. )
  1003. ) then
  1004. begin
  1005. fixref(list,ref);
  1006. end;
  1007. { certain thumb load require base and index }
  1008. if (current_settings.cputype in cpu_thumb) and
  1009. (oppostfix in [PF_SB,PF_SH]) and
  1010. (ref.base<>NR_NO) and (ref.index=NR_NO) then
  1011. begin
  1012. tmpreg:=getintregister(list,OS_ADDR);
  1013. a_load_const_reg(list,OS_INT,0,tmpreg);
  1014. ref.index:=tmpreg;
  1015. end;
  1016. { fold if there is base, index and offset, however, don't fold
  1017. for vfp memory instructions because we later fold the index }
  1018. if not(op in [A_FLDS,A_FLDD,A_FSTS,A_FSTD]) and
  1019. (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  1020. begin
  1021. if tmpreg<>NR_NO then
  1022. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg,tmpreg)
  1023. else
  1024. begin
  1025. tmpreg:=getintregister(list,OS_ADDR);
  1026. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg);
  1027. ref.base:=tmpreg;
  1028. end;
  1029. ref.offset:=0;
  1030. end;
  1031. { floating point operations have only limited references
  1032. we expect here, that a base is already set }
  1033. if (op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) and (ref.index<>NR_NO) then
  1034. begin
  1035. if ref.shiftmode<>SM_none then
  1036. internalerror(200309121);
  1037. if tmpreg<>NR_NO then
  1038. begin
  1039. if ref.base=tmpreg then
  1040. begin
  1041. if ref.signindex<0 then
  1042. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,tmpreg,ref.index))
  1043. else
  1044. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,tmpreg,ref.index));
  1045. ref.index:=NR_NO;
  1046. end
  1047. else
  1048. begin
  1049. if ref.index<>tmpreg then
  1050. internalerror(200403161);
  1051. if ref.signindex<0 then
  1052. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,ref.base,tmpreg))
  1053. else
  1054. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  1055. ref.base:=tmpreg;
  1056. ref.index:=NR_NO;
  1057. end;
  1058. end
  1059. else
  1060. begin
  1061. tmpreg:=getintregister(list,OS_ADDR);
  1062. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,ref.index));
  1063. ref.base:=tmpreg;
  1064. ref.index:=NR_NO;
  1065. end;
  1066. end;
  1067. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  1068. Result := ref;
  1069. end;
  1070. procedure tbasecgarm.a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);
  1071. var
  1072. oppostfix:toppostfix;
  1073. usedtmpref: treference;
  1074. tmpreg : tregister;
  1075. dir : integer;
  1076. begin
  1077. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  1078. FromSize := ToSize;
  1079. case ToSize of
  1080. { signed integer registers }
  1081. OS_8,
  1082. OS_S8:
  1083. oppostfix:=PF_B;
  1084. OS_16,
  1085. OS_S16:
  1086. oppostfix:=PF_H;
  1087. OS_32,
  1088. OS_S32,
  1089. { for vfp value stored in integer register }
  1090. OS_F32:
  1091. oppostfix:=PF_None;
  1092. else
  1093. InternalError(200308299);
  1094. end;
  1095. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[tosize]) then
  1096. begin
  1097. if target_info.endian=endian_big then
  1098. dir:=-1
  1099. else
  1100. dir:=1;
  1101. case FromSize of
  1102. OS_16,OS_S16:
  1103. begin
  1104. tmpreg:=getintregister(list,OS_INT);
  1105. usedtmpref:=ref;
  1106. if target_info.endian=endian_big then
  1107. inc(usedtmpref.offset,1);
  1108. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1109. inc(usedtmpref.offset,dir);
  1110. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1111. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1112. end;
  1113. OS_32,OS_S32:
  1114. begin
  1115. tmpreg:=getintregister(list,OS_INT);
  1116. usedtmpref:=ref;
  1117. if ref.alignment=2 then
  1118. begin
  1119. if target_info.endian=endian_big then
  1120. inc(usedtmpref.offset,2);
  1121. usedtmpref:=a_internal_load_reg_ref(list,OS_16,OS_16,reg,usedtmpref);
  1122. a_op_const_reg_reg(list,OP_SHR,OS_INT,16,reg,tmpreg);
  1123. inc(usedtmpref.offset,dir*2);
  1124. a_internal_load_reg_ref(list,OS_16,OS_16,tmpreg,usedtmpref);
  1125. end
  1126. else
  1127. begin
  1128. if target_info.endian=endian_big then
  1129. inc(usedtmpref.offset,3);
  1130. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1131. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1132. inc(usedtmpref.offset,dir);
  1133. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1134. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1135. inc(usedtmpref.offset,dir);
  1136. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1137. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1138. inc(usedtmpref.offset,dir);
  1139. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1140. end;
  1141. end
  1142. else
  1143. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1144. end;
  1145. end
  1146. else
  1147. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1148. end;
  1149. function tbasecgarm.a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  1150. var
  1151. oppostfix:toppostfix;
  1152. begin
  1153. case ToSize of
  1154. { signed integer registers }
  1155. OS_8,
  1156. OS_S8:
  1157. oppostfix:=PF_B;
  1158. OS_16,
  1159. OS_S16:
  1160. oppostfix:=PF_H;
  1161. OS_32,
  1162. OS_S32:
  1163. oppostfix:=PF_None;
  1164. else
  1165. InternalError(2003082910);
  1166. end;
  1167. result:=handle_load_store(list,A_STR,oppostfix,reg,ref);
  1168. end;
  1169. function tbasecgarm.a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  1170. var
  1171. oppostfix:toppostfix;
  1172. begin
  1173. case FromSize of
  1174. { signed integer registers }
  1175. OS_8:
  1176. oppostfix:=PF_B;
  1177. OS_S8:
  1178. oppostfix:=PF_SB;
  1179. OS_16:
  1180. oppostfix:=PF_H;
  1181. OS_S16:
  1182. oppostfix:=PF_SH;
  1183. OS_32,
  1184. OS_S32:
  1185. oppostfix:=PF_None;
  1186. else
  1187. InternalError(200308291);
  1188. end;
  1189. result:=handle_load_store(list,A_LDR,oppostfix,reg,ref);
  1190. end;
  1191. procedure tbasecgarm.a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);
  1192. var
  1193. so : tshifterop;
  1194. procedure do_shift(shiftmode : tshiftmode; shiftimm : byte; reg : tregister);
  1195. begin
  1196. so.shiftmode:=shiftmode;
  1197. so.shiftimm:=shiftimm;
  1198. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,reg2,reg,so));
  1199. end;
  1200. var
  1201. instr: taicpu;
  1202. conv_done: boolean;
  1203. begin
  1204. if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then
  1205. internalerror(2002090901);
  1206. conv_done:=false;
  1207. if tosize<>fromsize then
  1208. begin
  1209. shifterop_reset(so);
  1210. conv_done:=true;
  1211. if tcgsize2size[tosize]<=tcgsize2size[fromsize] then
  1212. fromsize:=tosize;
  1213. if current_settings.cputype<cpu_armv6 then
  1214. case fromsize of
  1215. OS_8:
  1216. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1217. OS_S8:
  1218. begin
  1219. do_shift(SM_LSL,24,reg1);
  1220. if tosize=OS_16 then
  1221. begin
  1222. do_shift(SM_ASR,8,reg2);
  1223. do_shift(SM_LSR,16,reg2);
  1224. end
  1225. else
  1226. do_shift(SM_ASR,24,reg2);
  1227. end;
  1228. OS_16:
  1229. begin
  1230. do_shift(SM_LSL,16,reg1);
  1231. do_shift(SM_LSR,16,reg2);
  1232. end;
  1233. OS_S16:
  1234. begin
  1235. do_shift(SM_LSL,16,reg1);
  1236. do_shift(SM_ASR,16,reg2)
  1237. end;
  1238. else
  1239. conv_done:=false;
  1240. end
  1241. else
  1242. case fromsize of
  1243. OS_8:
  1244. if current_settings.cputype in cpu_thumb then
  1245. list.concat(taicpu.op_reg_reg(A_UXTB,reg2,reg1))
  1246. else
  1247. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1248. OS_S8:
  1249. begin
  1250. if tosize=OS_16 then
  1251. begin
  1252. so.shiftmode:=SM_ROR;
  1253. so.shiftimm:=16;
  1254. list.concat(taicpu.op_reg_reg_shifterop(A_SXTB16,reg2,reg1,so));
  1255. do_shift(SM_LSR,16,reg2);
  1256. end
  1257. else
  1258. list.concat(taicpu.op_reg_reg(A_SXTB,reg2,reg1));
  1259. end;
  1260. OS_16:
  1261. list.concat(taicpu.op_reg_reg(A_UXTH,reg2,reg1));
  1262. OS_S16:
  1263. list.concat(taicpu.op_reg_reg(A_SXTH,reg2,reg1));
  1264. else
  1265. conv_done:=false;
  1266. end
  1267. end;
  1268. if not conv_done and (reg1<>reg2) then
  1269. begin
  1270. { same size, only a register mov required }
  1271. instr:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
  1272. list.Concat(instr);
  1273. { Notify the register allocator that we have written a move instruction so
  1274. it can try to eliminate it. }
  1275. add_move_instruction(instr);
  1276. end;
  1277. end;
  1278. procedure tbasecgarm.a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);
  1279. var
  1280. href,href2 : treference;
  1281. hloc : pcgparalocation;
  1282. begin
  1283. href:=ref;
  1284. hloc:=paraloc.location;
  1285. while assigned(hloc) do
  1286. begin
  1287. case hloc^.loc of
  1288. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  1289. begin
  1290. paramanager.allocparaloc(list,paraloc.location);
  1291. a_loadfpu_ref_reg(list,size,size,ref,hloc^.register);
  1292. end;
  1293. LOC_REGISTER :
  1294. case hloc^.size of
  1295. OS_32,
  1296. OS_F32:
  1297. begin
  1298. paramanager.allocparaloc(list,paraloc.location);
  1299. a_load_ref_reg(list,OS_32,OS_32,href,hloc^.register);
  1300. end;
  1301. OS_64,
  1302. OS_F64:
  1303. cg64.a_load64_ref_cgpara(list,href,paraloc);
  1304. else
  1305. a_load_ref_reg(list,hloc^.size,hloc^.size,href,hloc^.register);
  1306. end;
  1307. LOC_REFERENCE :
  1308. begin
  1309. reference_reset_base(href2,hloc^.reference.index,hloc^.reference.offset,paraloc.alignment);
  1310. { concatcopy should choose the best way to copy the data }
  1311. g_concatcopy(list,href,href2,tcgsize2size[hloc^.size]);
  1312. end;
  1313. else
  1314. internalerror(200408241);
  1315. end;
  1316. inc(href.offset,tcgsize2size[hloc^.size]);
  1317. hloc:=hloc^.next;
  1318. end;
  1319. end;
  1320. procedure tbasecgarm.a_loadfpu_reg_reg(list: TAsmList; fromsize,tosize: tcgsize; reg1, reg2: tregister);
  1321. begin
  1322. list.concat(setoppostfix(taicpu.op_reg_reg(A_MVF,reg2,reg1),cgsize2fpuoppostfix[tosize]));
  1323. end;
  1324. procedure tbasecgarm.a_loadfpu_ref_reg(list: TAsmList; fromsize,tosize: tcgsize; const ref: treference; reg: tregister);
  1325. var
  1326. oppostfix:toppostfix;
  1327. begin
  1328. case fromsize of
  1329. OS_32,
  1330. OS_F32:
  1331. oppostfix:=PF_S;
  1332. OS_64,
  1333. OS_F64:
  1334. oppostfix:=PF_D;
  1335. OS_F80:
  1336. oppostfix:=PF_E;
  1337. else
  1338. InternalError(200309021);
  1339. end;
  1340. handle_load_store(list,A_LDF,oppostfix,reg,ref);
  1341. if fromsize<>tosize then
  1342. a_loadfpu_reg_reg(list,fromsize,tosize,reg,reg);
  1343. end;
  1344. procedure tbasecgarm.a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);
  1345. var
  1346. oppostfix:toppostfix;
  1347. begin
  1348. case tosize of
  1349. OS_F32:
  1350. oppostfix:=PF_S;
  1351. OS_F64:
  1352. oppostfix:=PF_D;
  1353. OS_F80:
  1354. oppostfix:=PF_E;
  1355. else
  1356. InternalError(200309022);
  1357. end;
  1358. handle_load_store(list,A_STF,oppostfix,reg,ref);
  1359. end;
  1360. { comparison operations }
  1361. procedure tbasecgarm.a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  1362. l : tasmlabel);
  1363. var
  1364. tmpreg : tregister;
  1365. b : byte;
  1366. begin
  1367. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1368. if (not(current_settings.cputype in cpu_thumb) and is_shifter_const(a,b)) or
  1369. ((current_settings.cputype in cpu_thumb) and is_thumb_imm(a)) then
  1370. list.concat(taicpu.op_reg_const(A_CMP,reg,a))
  1371. { CMN reg,0 and CMN reg,$80000000 are different from CMP reg,$ffffffff
  1372. and CMP reg,$7fffffff regarding the flags according to the ARM manual }
  1373. else if (a<>$7fffffff) and (a<>-1) and not(current_settings.cputype in cpu_thumb) and is_shifter_const(-a,b) then
  1374. list.concat(taicpu.op_reg_const(A_CMN,reg,-a))
  1375. else
  1376. begin
  1377. tmpreg:=getintregister(list,size);
  1378. a_load_const_reg(list,size,a,tmpreg);
  1379. list.concat(taicpu.op_reg_reg(A_CMP,reg,tmpreg));
  1380. end;
  1381. a_jmp_cond(list,cmp_op,l);
  1382. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1383. end;
  1384. procedure tbasecgarm.a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; size: TCGSize; src, dst: TRegister);
  1385. begin
  1386. if reverse then
  1387. begin
  1388. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,src));
  1389. list.Concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,31));
  1390. list.Concat(taicpu.op_reg_reg_const(A_AND,dst,dst,255));
  1391. end
  1392. { it is decided during the compilation of the system unit if this code is used or not
  1393. so no additional check for rbit is needed }
  1394. else
  1395. begin
  1396. list.Concat(taicpu.op_reg_reg(A_RBIT,dst,src));
  1397. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,dst));
  1398. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1399. list.Concat(taicpu.op_reg_const(A_CMP,dst,32));
  1400. if current_settings.cputype in cpu_thumb2 then
  1401. list.Concat(taicpu.op_cond(A_IT, C_EQ));
  1402. list.Concat(setcondition(taicpu.op_reg_const(A_MOV,dst,$ff),C_EQ));
  1403. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1404. end;
  1405. end;
  1406. procedure tbasecgarm.a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel);
  1407. begin
  1408. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1409. list.concat(taicpu.op_reg_reg(A_CMP,reg2,reg1));
  1410. a_jmp_cond(list,cmp_op,l);
  1411. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1412. end;
  1413. procedure tbasecgarm.a_jmp_name(list : TAsmList;const s : string);
  1414. var
  1415. ai : taicpu;
  1416. begin
  1417. { generate far jump, leave it to the optimizer to get rid of it }
  1418. if current_settings.cputype in cpu_thumb then
  1419. ai:=taicpu.op_sym(A_BL,current_asmdata.RefAsmSymbol(s))
  1420. else
  1421. ai:=taicpu.op_sym(A_B,current_asmdata.RefAsmSymbol(s));
  1422. ai.is_jmp:=true;
  1423. list.concat(ai);
  1424. end;
  1425. procedure tbasecgarm.a_jmp_always(list : TAsmList;l: tasmlabel);
  1426. var
  1427. ai : taicpu;
  1428. begin
  1429. { generate far jump, leave it to the optimizer to get rid of it }
  1430. if current_settings.cputype in cpu_thumb then
  1431. ai:=taicpu.op_sym(A_BL,l)
  1432. else
  1433. ai:=taicpu.op_sym(A_B,l);
  1434. ai.is_jmp:=true;
  1435. list.concat(ai);
  1436. end;
  1437. procedure tbasecgarm.a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel);
  1438. var
  1439. ai : taicpu;
  1440. inv_flags : TResFlags;
  1441. hlabel : TAsmLabel;
  1442. begin
  1443. if current_settings.cputype in cpu_thumb then
  1444. begin
  1445. inv_flags:=f;
  1446. inverse_flags(inv_flags);
  1447. { the optimizer has to fix this if jump range is sufficient short }
  1448. current_asmdata.getjumplabel(hlabel);
  1449. ai:=setcondition(taicpu.op_sym(A_B,hlabel),flags_to_cond(inv_flags));
  1450. ai.is_jmp:=true;
  1451. list.concat(ai);
  1452. a_jmp_always(list,l);
  1453. a_label(list,hlabel);
  1454. end
  1455. else
  1456. begin
  1457. ai:=setcondition(taicpu.op_sym(A_B,l),flags_to_cond(f));
  1458. ai.is_jmp:=true;
  1459. list.concat(ai);
  1460. end;
  1461. end;
  1462. procedure tbasecgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  1463. begin
  1464. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  1465. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  1466. end;
  1467. procedure tbasecgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  1468. var
  1469. ref : treference;
  1470. shift : byte;
  1471. firstfloatreg,lastfloatreg,
  1472. r : byte;
  1473. mmregs,
  1474. regs, saveregs : tcpuregisterset;
  1475. r7offset,
  1476. stackmisalignment : pint;
  1477. postfix: toppostfix;
  1478. imm1, imm2: DWord;
  1479. begin
  1480. LocalSize:=align(LocalSize,4);
  1481. { call instruction does not put anything on the stack }
  1482. stackmisalignment:=0;
  1483. if not(nostackframe) then
  1484. begin
  1485. firstfloatreg:=RS_NO;
  1486. mmregs:=[];
  1487. case current_settings.fputype of
  1488. fpu_fpa,
  1489. fpu_fpa10,
  1490. fpu_fpa11:
  1491. begin
  1492. { save floating point registers? }
  1493. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1494. for r:=RS_F0 to RS_F7 do
  1495. if r in regs then
  1496. begin
  1497. if firstfloatreg=RS_NO then
  1498. firstfloatreg:=r;
  1499. lastfloatreg:=r;
  1500. inc(stackmisalignment,12);
  1501. end;
  1502. end;
  1503. fpu_vfpv2,
  1504. fpu_vfpv3,
  1505. fpu_vfpv3_d16:
  1506. begin;
  1507. mmregs:=rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall);
  1508. end;
  1509. end;
  1510. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1511. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1512. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  1513. { save int registers }
  1514. reference_reset(ref,4);
  1515. ref.index:=NR_STACK_POINTER_REG;
  1516. ref.addressmode:=AM_PREINDEXED;
  1517. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  1518. if not(target_info.system in systems_darwin) then
  1519. begin
  1520. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1521. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1522. begin
  1523. a_reg_alloc(list,NR_R12);
  1524. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  1525. end;
  1526. { the (old) ARM APCS requires saving both the stack pointer (to
  1527. crawl the stack) and the PC (to identify the function this
  1528. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  1529. and R15 -- still needs updating for EABI and Darwin, they don't
  1530. need that }
  1531. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1532. regs:=regs+[RS_FRAME_POINTER_REG,RS_R12,RS_R14,RS_R15]
  1533. else
  1534. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1535. include(regs,RS_R14);
  1536. if regs<>[] then
  1537. begin
  1538. for r:=RS_R0 to RS_R15 do
  1539. if r in regs then
  1540. inc(stackmisalignment,4);
  1541. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  1542. end;
  1543. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1544. begin
  1545. { the framepointer now points to the saved R15, so the saved
  1546. framepointer is at R11-12 (for get_caller_frame) }
  1547. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  1548. a_reg_dealloc(list,NR_R12);
  1549. end;
  1550. end
  1551. else
  1552. begin
  1553. { always save r14 if we use r7 as the framepointer, because
  1554. the parameter offsets are hardcoded in advance and always
  1555. assume that r14 sits on the stack right behind the saved r7
  1556. }
  1557. if current_procinfo.framepointer=NR_FRAME_POINTER_REG then
  1558. include(regs,RS_FRAME_POINTER_REG);
  1559. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1560. include(regs,RS_R14);
  1561. if regs<>[] then
  1562. begin
  1563. { on Darwin, you first have to save [r4-r7,lr], and then
  1564. [r8,r10,r11] and make r7 point to the previously saved
  1565. r7 so that you can perform a stack crawl based on it
  1566. ([r7] is previous stack frame, [r7+4] is return address
  1567. }
  1568. include(regs,RS_FRAME_POINTER_REG);
  1569. saveregs:=regs-[RS_R8,RS_R10,RS_R11];
  1570. r7offset:=0;
  1571. for r:=RS_R0 to RS_R15 do
  1572. if r in saveregs then
  1573. begin
  1574. inc(stackmisalignment,4);
  1575. if r<RS_FRAME_POINTER_REG then
  1576. inc(r7offset,4);
  1577. end;
  1578. { save the registers }
  1579. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1580. { make r7 point to the saved r7 (regardless of whether this
  1581. frame uses the framepointer, for backtrace purposes) }
  1582. if r7offset<>0 then
  1583. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_FRAME_POINTER_REG,NR_R13,r7offset))
  1584. else
  1585. list.concat(taicpu.op_reg_reg(A_MOV,NR_R7,NR_R13));
  1586. { now save the rest (if any) }
  1587. saveregs:=regs-saveregs;
  1588. if saveregs<>[] then
  1589. begin
  1590. for r:=RS_R8 to RS_R11 do
  1591. if r in saveregs then
  1592. inc(stackmisalignment,4);
  1593. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1594. end;
  1595. end;
  1596. end;
  1597. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  1598. if (LocalSize<>0) or
  1599. ((stackmisalignment<>0) and
  1600. ((pi_do_call in current_procinfo.flags) or
  1601. (po_assembler in current_procinfo.procdef.procoptions))) then
  1602. begin
  1603. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  1604. if is_shifter_const(localsize,shift) then
  1605. begin
  1606. a_reg_dealloc(list,NR_R12);
  1607. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  1608. end
  1609. else if split_into_shifter_const(localsize, imm1, imm2) then
  1610. begin
  1611. a_reg_dealloc(list,NR_R12);
  1612. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  1613. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  1614. end
  1615. else
  1616. begin
  1617. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  1618. a_reg_alloc(list,NR_R12);
  1619. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  1620. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  1621. a_reg_dealloc(list,NR_R12);
  1622. end;
  1623. end;
  1624. if (mmregs<>[]) or
  1625. (firstfloatreg<>RS_NO) then
  1626. begin
  1627. reference_reset(ref,4);
  1628. if (tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023) or
  1629. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv3_d16]) then
  1630. begin
  1631. if not is_shifter_const(tarmprocinfo(current_procinfo).floatregstart,shift) then
  1632. begin
  1633. a_reg_alloc(list,NR_R12);
  1634. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  1635. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1636. a_reg_dealloc(list,NR_R12);
  1637. end
  1638. else
  1639. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tarmprocinfo(current_procinfo).floatregstart));
  1640. ref.base:=NR_R12;
  1641. end
  1642. else
  1643. begin
  1644. ref.base:=current_procinfo.framepointer;
  1645. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  1646. end;
  1647. case current_settings.fputype of
  1648. fpu_fpa,
  1649. fpu_fpa10,
  1650. fpu_fpa11:
  1651. begin
  1652. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  1653. lastfloatreg-firstfloatreg+1,ref));
  1654. end;
  1655. fpu_vfpv2,
  1656. fpu_vfpv3,
  1657. fpu_vfpv3_d16:
  1658. begin
  1659. ref.index:=ref.base;
  1660. ref.base:=NR_NO;
  1661. { FSTMX is deprecated on ARMv6 and later }
  1662. if (current_settings.cputype<cpu_armv6) then
  1663. postfix:=PF_IAX
  1664. else
  1665. postfix:=PF_IAD;
  1666. list.concat(setoppostfix(taicpu.op_ref_regset(A_FSTM,ref,R_MMREGISTER,R_SUBFD,mmregs),postfix));
  1667. end;
  1668. end;
  1669. end;
  1670. end;
  1671. end;
  1672. procedure tbasecgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  1673. var
  1674. ref : treference;
  1675. LocalSize : longint;
  1676. firstfloatreg,lastfloatreg,
  1677. r,
  1678. shift : byte;
  1679. mmregs,
  1680. saveregs,
  1681. regs : tcpuregisterset;
  1682. stackmisalignment: pint;
  1683. mmpostfix: toppostfix;
  1684. imm1, imm2: DWord;
  1685. begin
  1686. if not(nostackframe) then
  1687. begin
  1688. stackmisalignment:=0;
  1689. firstfloatreg:=RS_NO;
  1690. mmregs:=[];
  1691. case current_settings.fputype of
  1692. fpu_fpa,
  1693. fpu_fpa10,
  1694. fpu_fpa11:
  1695. begin
  1696. { restore floating point registers? }
  1697. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1698. for r:=RS_F0 to RS_F7 do
  1699. if r in regs then
  1700. begin
  1701. if firstfloatreg=RS_NO then
  1702. firstfloatreg:=r;
  1703. lastfloatreg:=r;
  1704. { floating point register space is already included in
  1705. localsize below by calc_stackframe_size
  1706. inc(stackmisalignment,12);
  1707. }
  1708. end;
  1709. end;
  1710. fpu_vfpv2,
  1711. fpu_vfpv3,
  1712. fpu_vfpv3_d16:
  1713. begin;
  1714. { restore vfp registers? }
  1715. mmregs:=rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall);
  1716. end;
  1717. end;
  1718. if (firstfloatreg<>RS_NO) or
  1719. (mmregs<>[]) then
  1720. begin
  1721. reference_reset(ref,4);
  1722. if (tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023) or
  1723. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv3_d16]) then
  1724. begin
  1725. if not is_shifter_const(tarmprocinfo(current_procinfo).floatregstart,shift) then
  1726. begin
  1727. a_reg_alloc(list,NR_R12);
  1728. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  1729. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1730. a_reg_dealloc(list,NR_R12);
  1731. end
  1732. else
  1733. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tarmprocinfo(current_procinfo).floatregstart));
  1734. ref.base:=NR_R12;
  1735. end
  1736. else
  1737. begin
  1738. ref.base:=current_procinfo.framepointer;
  1739. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  1740. end;
  1741. case current_settings.fputype of
  1742. fpu_fpa,
  1743. fpu_fpa10,
  1744. fpu_fpa11:
  1745. begin
  1746. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  1747. lastfloatreg-firstfloatreg+1,ref));
  1748. end;
  1749. fpu_vfpv2,
  1750. fpu_vfpv3,
  1751. fpu_vfpv3_d16:
  1752. begin
  1753. ref.index:=ref.base;
  1754. ref.base:=NR_NO;
  1755. { FLDMX is deprecated on ARMv6 and later }
  1756. if (current_settings.cputype<cpu_armv6) then
  1757. mmpostfix:=PF_IAX
  1758. else
  1759. mmpostfix:=PF_IAD;
  1760. list.concat(setoppostfix(taicpu.op_ref_regset(A_FLDM,ref,R_MMREGISTER,R_SUBFD,mmregs),mmpostfix));
  1761. end;
  1762. end;
  1763. end;
  1764. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall) ;
  1765. if (pi_do_call in current_procinfo.flags) or
  1766. (regs<>[]) or
  1767. ((target_info.system in systems_darwin) and
  1768. (current_procinfo.framepointer<>NR_STACK_POINTER_REG)) then
  1769. begin
  1770. exclude(regs,RS_R14);
  1771. include(regs,RS_R15);
  1772. if (target_info.system in systems_darwin) then
  1773. include(regs,RS_FRAME_POINTER_REG);
  1774. end;
  1775. if not(target_info.system in systems_darwin) then
  1776. begin
  1777. { restore saved stack pointer to SP (R13) and saved lr to PC (R15).
  1778. The saved PC came after that but is discarded, since we restore
  1779. the stack pointer }
  1780. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  1781. regs:=regs+[RS_FRAME_POINTER_REG,RS_R13,RS_R15];
  1782. end
  1783. else
  1784. begin
  1785. { restore R8-R11 already if necessary (they've been stored
  1786. before the others) }
  1787. saveregs:=regs*[RS_R8,RS_R10,RS_R11];
  1788. if saveregs<>[] then
  1789. begin
  1790. reference_reset(ref,4);
  1791. ref.index:=NR_STACK_POINTER_REG;
  1792. ref.addressmode:=AM_PREINDEXED;
  1793. for r:=RS_R8 to RS_R11 do
  1794. if r in saveregs then
  1795. inc(stackmisalignment,4);
  1796. regs:=regs-saveregs;
  1797. end;
  1798. end;
  1799. for r:=RS_R0 to RS_R15 do
  1800. if r in regs then
  1801. inc(stackmisalignment,4);
  1802. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  1803. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  1804. (target_info.system in systems_darwin) then
  1805. begin
  1806. LocalSize:=current_procinfo.calc_stackframe_size;
  1807. if (LocalSize<>0) or
  1808. ((stackmisalignment<>0) and
  1809. ((pi_do_call in current_procinfo.flags) or
  1810. (po_assembler in current_procinfo.procdef.procoptions))) then
  1811. begin
  1812. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  1813. if is_shifter_const(LocalSize,shift) then
  1814. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  1815. else if split_into_shifter_const(localsize, imm1, imm2) then
  1816. begin
  1817. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  1818. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  1819. end
  1820. else
  1821. begin
  1822. a_reg_alloc(list,NR_R12);
  1823. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  1824. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  1825. a_reg_dealloc(list,NR_R12);
  1826. end;
  1827. end;
  1828. if (target_info.system in systems_darwin) and
  1829. (saveregs<>[]) then
  1830. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1831. if regs=[] then
  1832. begin
  1833. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  1834. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  1835. else
  1836. list.concat(taicpu.op_reg(A_BX,NR_R14))
  1837. end
  1838. else
  1839. begin
  1840. reference_reset(ref,4);
  1841. ref.index:=NR_STACK_POINTER_REG;
  1842. ref.addressmode:=AM_PREINDEXED;
  1843. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  1844. end;
  1845. end
  1846. else
  1847. begin
  1848. { restore int registers and return }
  1849. reference_reset(ref,4);
  1850. ref.index:=NR_FRAME_POINTER_REG;
  1851. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_EA));
  1852. end;
  1853. end
  1854. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  1855. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  1856. else
  1857. list.concat(taicpu.op_reg(A_BX,NR_R14))
  1858. end;
  1859. procedure tbasecgarm.a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);
  1860. var
  1861. b : byte;
  1862. tmpref : treference;
  1863. instr : taicpu;
  1864. begin
  1865. if ref.addressmode<>AM_OFFSET then
  1866. internalerror(200309071);
  1867. tmpref:=ref;
  1868. { Be sure to have a base register }
  1869. if (tmpref.base=NR_NO) then
  1870. begin
  1871. if tmpref.shiftmode<>SM_None then
  1872. internalerror(200308294);
  1873. if tmpref.signindex<0 then
  1874. internalerror(200312023);
  1875. tmpref.base:=tmpref.index;
  1876. tmpref.index:=NR_NO;
  1877. end;
  1878. if assigned(tmpref.symbol) or
  1879. not((is_shifter_const(tmpref.offset,b)) or
  1880. (is_shifter_const(-tmpref.offset,b))
  1881. ) then
  1882. fixref(list,tmpref);
  1883. { expect a base here if there is an index }
  1884. if (tmpref.base=NR_NO) and (tmpref.index<>NR_NO) then
  1885. internalerror(200312022);
  1886. if tmpref.index<>NR_NO then
  1887. begin
  1888. if tmpref.shiftmode<>SM_None then
  1889. internalerror(200312021);
  1890. if tmpref.signindex<0 then
  1891. a_op_reg_reg_reg(list,OP_SUB,OS_ADDR,tmpref.base,tmpref.index,r)
  1892. else
  1893. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpref.base,tmpref.index,r);
  1894. if tmpref.offset<>0 then
  1895. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,r,r);
  1896. end
  1897. else
  1898. begin
  1899. if tmpref.base=NR_NO then
  1900. a_load_const_reg(list,OS_ADDR,tmpref.offset,r)
  1901. else
  1902. if tmpref.offset<>0 then
  1903. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,tmpref.base,r)
  1904. else
  1905. begin
  1906. instr:=taicpu.op_reg_reg(A_MOV,r,tmpref.base);
  1907. list.concat(instr);
  1908. add_move_instruction(instr);
  1909. end;
  1910. end;
  1911. end;
  1912. procedure tbasecgarm.fixref(list : TAsmList;var ref : treference);
  1913. var
  1914. tmpreg : tregister;
  1915. tmpref : treference;
  1916. l : tasmlabel;
  1917. indirection_done : boolean;
  1918. begin
  1919. { absolute symbols can't be handled directly, we've to store the symbol reference
  1920. in the text segment and access it pc relative
  1921. For now, we assume that references where base or index equals to PC are already
  1922. relative, all other references are assumed to be absolute and thus they need
  1923. to be handled extra.
  1924. A proper solution would be to change refoptions to a set and store the information
  1925. if the symbol is absolute or relative there.
  1926. }
  1927. { create consts entry }
  1928. reference_reset(tmpref,4);
  1929. current_asmdata.getjumplabel(l);
  1930. cg.a_label(current_procinfo.aktlocaldata,l);
  1931. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  1932. indirection_done:=false;
  1933. if assigned(ref.symbol) then
  1934. begin
  1935. if (target_info.system=system_arm_darwin) and
  1936. (ref.symbol.bind in [AB_EXTERNAL,AB_WEAK_EXTERNAL,AB_PRIVATE_EXTERN,AB_COMMON]) then
  1937. begin
  1938. tmpreg:=g_indirect_sym_load(list,ref.symbol.name,asmsym2indsymflags(ref.symbol));
  1939. if ref.offset<>0 then
  1940. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  1941. indirection_done:=true;
  1942. end
  1943. else
  1944. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset))
  1945. end
  1946. else
  1947. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ref.offset));
  1948. { load consts entry }
  1949. if not indirection_done then
  1950. begin
  1951. tmpreg:=getintregister(list,OS_INT);
  1952. tmpref.symbol:=l;
  1953. tmpref.base:=NR_PC;
  1954. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  1955. end;
  1956. { This routine can be called with PC as base/index in case the offset
  1957. was too large to encode in a load/store. In that case, the entire
  1958. absolute expression has been re-encoded in a new constpool entry, and
  1959. we have to remove the use of PC from the original reference (the code
  1960. above made everything relative to the value loaded from the new
  1961. constpool entry) }
  1962. if is_pc(ref.base) then
  1963. ref.base:=NR_NO;
  1964. if is_pc(ref.index) then
  1965. ref.index:=NR_NO;
  1966. if (ref.base<>NR_NO) then
  1967. begin
  1968. if ref.index<>NR_NO then
  1969. begin
  1970. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  1971. ref.base:=tmpreg;
  1972. end
  1973. else
  1974. if ref.base<>NR_PC then
  1975. begin
  1976. ref.index:=tmpreg;
  1977. ref.shiftimm:=0;
  1978. ref.signindex:=1;
  1979. ref.shiftmode:=SM_None;
  1980. end
  1981. else
  1982. ref.base:=tmpreg;
  1983. end
  1984. else
  1985. ref.base:=tmpreg;
  1986. ref.offset:=0;
  1987. ref.symbol:=nil;
  1988. end;
  1989. procedure tbasecgarm.g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  1990. var
  1991. paraloc1,paraloc2,paraloc3 : TCGPara;
  1992. pd : tprocdef;
  1993. begin
  1994. pd:=search_system_proc('MOVE');
  1995. paraloc1.init;
  1996. paraloc2.init;
  1997. paraloc3.init;
  1998. paramanager.getintparaloc(pd,1,paraloc1);
  1999. paramanager.getintparaloc(pd,2,paraloc2);
  2000. paramanager.getintparaloc(pd,3,paraloc3);
  2001. a_load_const_cgpara(list,OS_SINT,len,paraloc3);
  2002. a_loadaddr_ref_cgpara(list,dest,paraloc2);
  2003. a_loadaddr_ref_cgpara(list,source,paraloc1);
  2004. paramanager.freecgpara(list,paraloc3);
  2005. paramanager.freecgpara(list,paraloc2);
  2006. paramanager.freecgpara(list,paraloc1);
  2007. alloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2008. alloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2009. a_call_name(list,'FPC_MOVE',false);
  2010. dealloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2011. dealloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2012. paraloc3.done;
  2013. paraloc2.done;
  2014. paraloc1.done;
  2015. end;
  2016. procedure tbasecgarm.g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  2017. const
  2018. maxtmpreg_arm = 10; {roozbeh: can be reduced to 8 or lower if might conflick with reserved ones,also +2 is used becouse of regs required for referencing}
  2019. maxtmpreg_thumb = 5;
  2020. var
  2021. srcref,dstref,usedtmpref,usedtmpref2:treference;
  2022. srcreg,destreg,countreg,r,tmpreg:tregister;
  2023. helpsize:aint;
  2024. copysize:byte;
  2025. cgsize:Tcgsize;
  2026. tmpregisters:array[1..maxtmpreg_arm] of tregister;
  2027. maxtmpreg,
  2028. tmpregi,tmpregi2:byte;
  2029. { will never be called with count<=4 }
  2030. procedure genloop(count : aword;size : byte);
  2031. const
  2032. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2033. var
  2034. l : tasmlabel;
  2035. begin
  2036. current_asmdata.getjumplabel(l);
  2037. if count<size then size:=1;
  2038. a_load_const_reg(list,OS_INT,count div size,countreg);
  2039. cg.a_label(list,l);
  2040. srcref.addressmode:=AM_POSTINDEXED;
  2041. dstref.addressmode:=AM_POSTINDEXED;
  2042. srcref.offset:=size;
  2043. dstref.offset:=size;
  2044. r:=getintregister(list,size2opsize[size]);
  2045. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2046. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2047. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1),PF_S));
  2048. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2049. a_jmp_flags(list,F_NE,l);
  2050. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2051. srcref.offset:=1;
  2052. dstref.offset:=1;
  2053. case count mod size of
  2054. 1:
  2055. begin
  2056. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2057. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2058. end;
  2059. 2:
  2060. if aligned then
  2061. begin
  2062. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2063. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2064. end
  2065. else
  2066. begin
  2067. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2068. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2069. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2070. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2071. end;
  2072. 3:
  2073. if aligned then
  2074. begin
  2075. srcref.offset:=2;
  2076. dstref.offset:=2;
  2077. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2078. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2079. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2080. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2081. end
  2082. else
  2083. begin
  2084. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2085. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2086. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2087. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2088. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2089. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2090. end;
  2091. end;
  2092. { keep the registers alive }
  2093. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2094. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2095. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2096. end;
  2097. { will never be called with count<=4 }
  2098. procedure genloop_thumb(count : aword;size : byte);
  2099. procedure refincofs(const ref : treference;const value : longint = 1);
  2100. begin
  2101. a_op_const_reg(list,OP_ADD,OS_ADDR,value,ref.base);
  2102. end;
  2103. const
  2104. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2105. var
  2106. l : tasmlabel;
  2107. begin
  2108. current_asmdata.getjumplabel(l);
  2109. if count<size then size:=1;
  2110. a_load_const_reg(list,OS_INT,count div size,countreg);
  2111. cg.a_label(list,l);
  2112. r:=getintregister(list,size2opsize[size]);
  2113. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2114. refincofs(srcref);
  2115. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2116. refincofs(dstref);
  2117. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2118. list.concat(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1));
  2119. a_jmp_flags(list,F_NE,l);
  2120. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2121. case count mod size of
  2122. 1:
  2123. begin
  2124. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2125. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2126. end;
  2127. 2:
  2128. if aligned then
  2129. begin
  2130. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2131. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2132. end
  2133. else
  2134. begin
  2135. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2136. refincofs(srcref);
  2137. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2138. refincofs(dstref);
  2139. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2140. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2141. end;
  2142. 3:
  2143. if aligned then
  2144. begin
  2145. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2146. refincofs(srcref,2);
  2147. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2148. refincofs(dstref,2);
  2149. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2150. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2151. end
  2152. else
  2153. begin
  2154. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2155. refincofs(srcref);
  2156. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2157. refincofs(dstref);
  2158. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2159. refincofs(srcref);
  2160. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2161. refincofs(dstref);
  2162. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2163. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2164. end;
  2165. end;
  2166. { keep the registers alive }
  2167. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2168. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2169. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2170. end;
  2171. begin
  2172. if len=0 then
  2173. exit;
  2174. if current_settings.cputype in cpu_thumb then
  2175. maxtmpreg:=maxtmpreg_thumb
  2176. else
  2177. maxtmpreg:=maxtmpreg_arm;
  2178. helpsize:=12+maxtmpreg*4;//52 with maxtmpreg=10
  2179. dstref:=dest;
  2180. srcref:=source;
  2181. if cs_opt_size in current_settings.optimizerswitches then
  2182. helpsize:=8;
  2183. if aligned and (len=4) then
  2184. begin
  2185. tmpreg:=getintregister(list,OS_32);
  2186. a_load_ref_reg(list,OS_32,OS_32,source,tmpreg);
  2187. a_load_reg_ref(list,OS_32,OS_32,tmpreg,dest);
  2188. end
  2189. else if aligned and (len=2) then
  2190. begin
  2191. tmpreg:=getintregister(list,OS_16);
  2192. a_load_ref_reg(list,OS_16,OS_16,source,tmpreg);
  2193. a_load_reg_ref(list,OS_16,OS_16,tmpreg,dest);
  2194. end
  2195. else if (len<=helpsize) and aligned then
  2196. begin
  2197. tmpregi:=0;
  2198. srcreg:=getintregister(list,OS_ADDR);
  2199. { explicit pc relative addressing, could be
  2200. e.g. a floating point constant }
  2201. if source.base=NR_PC then
  2202. begin
  2203. { ... then we don't need a loadaddr }
  2204. srcref:=source;
  2205. end
  2206. else
  2207. begin
  2208. a_loadaddr_ref_reg(list,source,srcreg);
  2209. reference_reset_base(srcref,srcreg,0,source.alignment);
  2210. end;
  2211. while (len div 4 <> 0) and (tmpregi<maxtmpreg) do
  2212. begin
  2213. inc(tmpregi);
  2214. tmpregisters[tmpregi]:=getintregister(list,OS_32);
  2215. a_load_ref_reg(list,OS_32,OS_32,srcref,tmpregisters[tmpregi]);
  2216. inc(srcref.offset,4);
  2217. dec(len,4);
  2218. end;
  2219. destreg:=getintregister(list,OS_ADDR);
  2220. a_loadaddr_ref_reg(list,dest,destreg);
  2221. reference_reset_base(dstref,destreg,0,dest.alignment);
  2222. tmpregi2:=1;
  2223. while (tmpregi2<=tmpregi) do
  2224. begin
  2225. a_load_reg_ref(list,OS_32,OS_32,tmpregisters[tmpregi2],dstref);
  2226. inc(dstref.offset,4);
  2227. inc(tmpregi2);
  2228. end;
  2229. copysize:=4;
  2230. cgsize:=OS_32;
  2231. while len<>0 do
  2232. begin
  2233. if len<2 then
  2234. begin
  2235. copysize:=1;
  2236. cgsize:=OS_8;
  2237. end
  2238. else if len<4 then
  2239. begin
  2240. copysize:=2;
  2241. cgsize:=OS_16;
  2242. end;
  2243. dec(len,copysize);
  2244. r:=getintregister(list,cgsize);
  2245. a_load_ref_reg(list,cgsize,cgsize,srcref,r);
  2246. a_load_reg_ref(list,cgsize,cgsize,r,dstref);
  2247. inc(srcref.offset,copysize);
  2248. inc(dstref.offset,copysize);
  2249. end;{end of while}
  2250. end
  2251. else
  2252. begin
  2253. cgsize:=OS_32;
  2254. if (len<=4) then{len<=4 and not aligned}
  2255. begin
  2256. r:=getintregister(list,cgsize);
  2257. usedtmpref:=a_internal_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2258. if Len=1 then
  2259. a_load_reg_ref(list,OS_8,OS_8,r,dstref)
  2260. else
  2261. begin
  2262. tmpreg:=getintregister(list,cgsize);
  2263. usedtmpref2:=a_internal_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2264. inc(usedtmpref.offset,1);
  2265. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2266. inc(usedtmpref2.offset,1);
  2267. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2268. if len>2 then
  2269. begin
  2270. inc(usedtmpref.offset,1);
  2271. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2272. inc(usedtmpref2.offset,1);
  2273. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2274. if len>3 then
  2275. begin
  2276. inc(usedtmpref.offset,1);
  2277. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2278. inc(usedtmpref2.offset,1);
  2279. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2280. end;
  2281. end;
  2282. end;
  2283. end{end of if len<=4}
  2284. else
  2285. begin{unaligned & 4<len<helpsize **or** aligned/unaligned & len>helpsize}
  2286. destreg:=getintregister(list,OS_ADDR);
  2287. a_loadaddr_ref_reg(list,dest,destreg);
  2288. reference_reset_base(dstref,destreg,0,dest.alignment);
  2289. srcreg:=getintregister(list,OS_ADDR);
  2290. a_loadaddr_ref_reg(list,source,srcreg);
  2291. reference_reset_base(srcref,srcreg,0,source.alignment);
  2292. countreg:=getintregister(list,OS_32);
  2293. // if cs_opt_size in current_settings.optimizerswitches then
  2294. { roozbeh : it seems loading 1 byte is faster becouse of caching/fetching(?) }
  2295. {if aligned then
  2296. genloop(len,4)
  2297. else}
  2298. if current_settings.cputype in cpu_thumb then
  2299. genloop_thumb(len,1)
  2300. else
  2301. genloop(len,1);
  2302. end;
  2303. end;
  2304. end;
  2305. procedure tbasecgarm.g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);
  2306. begin
  2307. g_concatcopy_internal(list,source,dest,len,false);
  2308. end;
  2309. procedure tbasecgarm.g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);
  2310. begin
  2311. if (source.alignment in [1,3]) or
  2312. (dest.alignment in [1,3]) then
  2313. g_concatcopy_internal(list,source,dest,len,false)
  2314. else
  2315. g_concatcopy_internal(list,source,dest,len,true);
  2316. end;
  2317. procedure tbasecgarm.g_overflowCheck(list : TAsmList;const l : tlocation;def : tdef);
  2318. var
  2319. ovloc : tlocation;
  2320. begin
  2321. ovloc.loc:=LOC_VOID;
  2322. g_overflowCheck_loc(list,l,def,ovloc);
  2323. end;
  2324. procedure tbasecgarm.g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);
  2325. var
  2326. hl : tasmlabel;
  2327. ai:TAiCpu;
  2328. hflags : tresflags;
  2329. begin
  2330. if not(cs_check_overflow in current_settings.localswitches) then
  2331. exit;
  2332. current_asmdata.getjumplabel(hl);
  2333. case ovloc.loc of
  2334. LOC_VOID:
  2335. begin
  2336. ai:=taicpu.op_sym(A_B,hl);
  2337. ai.is_jmp:=true;
  2338. if not((def.typ=pointerdef) or
  2339. ((def.typ=orddef) and
  2340. (torddef(def).ordtype in [u64bit,u16bit,u32bit,u8bit,uchar,
  2341. pasbool8,pasbool16,pasbool32,pasbool64]))) then
  2342. ai.SetCondition(C_VC)
  2343. else
  2344. if TAiCpu(List.Last).opcode in [A_RSB,A_RSC,A_SBC,A_SUB] then
  2345. ai.SetCondition(C_CS)
  2346. else
  2347. ai.SetCondition(C_CC);
  2348. list.concat(ai);
  2349. end;
  2350. LOC_FLAGS:
  2351. begin
  2352. hflags:=ovloc.resflags;
  2353. inverse_flags(hflags);
  2354. cg.a_jmp_flags(list,hflags,hl);
  2355. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2356. end;
  2357. else
  2358. internalerror(200409281);
  2359. end;
  2360. a_call_name(list,'FPC_OVERFLOW',false);
  2361. a_label(list,hl);
  2362. end;
  2363. procedure tbasecgarm.g_save_registers(list : TAsmList);
  2364. begin
  2365. { this work is done in g_proc_entry }
  2366. end;
  2367. procedure tbasecgarm.g_restore_registers(list : TAsmList);
  2368. begin
  2369. { this work is done in g_proc_exit }
  2370. end;
  2371. procedure tbasecgarm.a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  2372. var
  2373. ai : taicpu;
  2374. hlabel : TAsmLabel;
  2375. begin
  2376. if current_settings.cputype in cpu_thumb then
  2377. begin
  2378. { the optimizer has to fix this if jump range is sufficient short }
  2379. current_asmdata.getjumplabel(hlabel);
  2380. ai:=Taicpu.Op_sym(A_B,hlabel);
  2381. ai.SetCondition(inverse_cond(OpCmp2AsmCond[cond]));
  2382. ai.is_jmp:=true;
  2383. list.concat(ai);
  2384. a_jmp_always(list,l);
  2385. a_label(list,hlabel);
  2386. end
  2387. else
  2388. begin
  2389. ai:=Taicpu.Op_sym(A_B,l);
  2390. ai.SetCondition(OpCmp2AsmCond[cond]);
  2391. ai.is_jmp:=true;
  2392. list.concat(ai);
  2393. end;
  2394. end;
  2395. procedure tbasecgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  2396. var
  2397. hsym : tsym;
  2398. href : treference;
  2399. paraloc : Pcgparalocation;
  2400. shift : byte;
  2401. begin
  2402. { calculate the parameter info for the procdef }
  2403. procdef.init_paraloc_info(callerside);
  2404. hsym:=tsym(procdef.parast.Find('self'));
  2405. if not(assigned(hsym) and
  2406. (hsym.typ=paravarsym)) then
  2407. internalerror(200305251);
  2408. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  2409. while paraloc<>nil do
  2410. with paraloc^ do
  2411. begin
  2412. case loc of
  2413. LOC_REGISTER:
  2414. begin
  2415. if is_shifter_const(ioffset,shift) then
  2416. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  2417. else
  2418. begin
  2419. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  2420. a_op_reg_reg(list,OP_SUB,size,NR_R12,register);
  2421. end;
  2422. end;
  2423. LOC_REFERENCE:
  2424. begin
  2425. { offset in the wrapper needs to be adjusted for the stored
  2426. return address }
  2427. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),sizeof(pint));
  2428. if is_shifter_const(ioffset,shift) then
  2429. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  2430. else
  2431. begin
  2432. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  2433. a_op_reg_ref(list,OP_SUB,size,NR_R12,href);
  2434. end;
  2435. end
  2436. else
  2437. internalerror(200309189);
  2438. end;
  2439. paraloc:=next;
  2440. end;
  2441. end;
  2442. procedure tbasecgarm.g_stackpointer_alloc(list: TAsmList; size: longint);
  2443. begin
  2444. internalerror(200807237);
  2445. end;
  2446. function get_scalar_mm_op(fromsize,tosize : tcgsize) : tasmop;
  2447. const
  2448. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of tasmop = (
  2449. (A_FCPYS,A_FCVTSD,A_NONE,A_NONE,A_NONE),
  2450. (A_FCVTDS,A_FCPYD,A_NONE,A_NONE,A_NONE),
  2451. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2452. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2453. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE));
  2454. begin
  2455. result:=convertop[fromsize,tosize];
  2456. if result=A_NONE then
  2457. internalerror(200312205);
  2458. end;
  2459. procedure tbasecgarm.a_loadmm_reg_reg(list: tasmlist; fromsize,tosize: tcgsize; reg1,reg2: tregister; shuffle: pmmshuffle);
  2460. var
  2461. instr: taicpu;
  2462. begin
  2463. if shuffle=nil then
  2464. begin
  2465. if fromsize=tosize then
  2466. { needs correct size in case of spilling }
  2467. case fromsize of
  2468. OS_F32:
  2469. instr:=taicpu.op_reg_reg(A_FCPYS,reg2,reg1);
  2470. OS_F64:
  2471. instr:=taicpu.op_reg_reg(A_FCPYD,reg2,reg1);
  2472. else
  2473. internalerror(2009112405);
  2474. end
  2475. else
  2476. internalerror(2009112406);
  2477. end
  2478. else if shufflescalar(shuffle) then
  2479. instr:=taicpu.op_reg_reg(get_scalar_mm_op(tosize,fromsize),reg2,reg1)
  2480. else
  2481. internalerror(2009112407);
  2482. list.concat(instr);
  2483. case instr.opcode of
  2484. A_FCPYS,
  2485. A_FCPYD:
  2486. add_move_instruction(instr);
  2487. end;
  2488. end;
  2489. procedure tbasecgarm.a_loadmm_ref_reg(list: tasmlist; fromsize,tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  2490. var
  2491. intreg,
  2492. tmpmmreg : tregister;
  2493. reg64 : tregister64;
  2494. op : tasmop;
  2495. begin
  2496. if assigned(shuffle) and
  2497. not(shufflescalar(shuffle)) then
  2498. internalerror(2009112413);
  2499. case fromsize of
  2500. OS_32,OS_S32:
  2501. begin
  2502. fromsize:=OS_F32;
  2503. { since we are loading an integer, no conversion may be required }
  2504. if (fromsize<>tosize) then
  2505. internalerror(2009112801);
  2506. end;
  2507. OS_64,OS_S64:
  2508. begin
  2509. fromsize:=OS_F64;
  2510. { since we are loading an integer, no conversion may be required }
  2511. if (fromsize<>tosize) then
  2512. internalerror(2009112901);
  2513. end;
  2514. end;
  2515. if (fromsize<>tosize) then
  2516. tmpmmreg:=getmmregister(list,fromsize)
  2517. else
  2518. tmpmmreg:=reg;
  2519. if (ref.alignment in [1,2]) then
  2520. begin
  2521. case fromsize of
  2522. OS_F32:
  2523. begin
  2524. intreg:=getintregister(list,OS_32);
  2525. a_load_ref_reg(list,OS_32,OS_32,ref,intreg);
  2526. a_loadmm_intreg_reg(list,OS_32,OS_F32,intreg,tmpmmreg,mms_movescalar);
  2527. end;
  2528. OS_F64:
  2529. begin
  2530. reg64.reglo:=getintregister(list,OS_32);
  2531. reg64.reghi:=getintregister(list,OS_32);
  2532. cg64.a_load64_ref_reg(list,ref,reg64);
  2533. cg64.a_loadmm_intreg64_reg(list,OS_F64,reg64,tmpmmreg);
  2534. end;
  2535. else
  2536. internalerror(2009112412);
  2537. end;
  2538. end
  2539. else
  2540. begin
  2541. case fromsize of
  2542. OS_F32:
  2543. op:=A_FLDS;
  2544. OS_F64:
  2545. op:=A_FLDD;
  2546. else
  2547. internalerror(2009112415);
  2548. end;
  2549. handle_load_store(list,op,PF_None,tmpmmreg,ref);
  2550. end;
  2551. if (tmpmmreg<>reg) then
  2552. a_loadmm_reg_reg(list,fromsize,tosize,tmpmmreg,reg,shuffle);
  2553. end;
  2554. procedure tbasecgarm.a_loadmm_reg_ref(list: tasmlist; fromsize,tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  2555. var
  2556. intreg,
  2557. tmpmmreg : tregister;
  2558. reg64 : tregister64;
  2559. op : tasmop;
  2560. begin
  2561. if assigned(shuffle) and
  2562. not(shufflescalar(shuffle)) then
  2563. internalerror(2009112416);
  2564. case tosize of
  2565. OS_32,OS_S32:
  2566. begin
  2567. tosize:=OS_F32;
  2568. { since we are loading an integer, no conversion may be required }
  2569. if (fromsize<>tosize) then
  2570. internalerror(2009112801);
  2571. end;
  2572. OS_64,OS_S64:
  2573. begin
  2574. tosize:=OS_F64;
  2575. { since we are loading an integer, no conversion may be required }
  2576. if (fromsize<>tosize) then
  2577. internalerror(2009112901);
  2578. end;
  2579. end;
  2580. if (fromsize<>tosize) then
  2581. begin
  2582. tmpmmreg:=getmmregister(list,tosize);
  2583. a_loadmm_reg_reg(list,fromsize,tosize,reg,tmpmmreg,shuffle);
  2584. end
  2585. else
  2586. tmpmmreg:=reg;
  2587. if (ref.alignment in [1,2]) then
  2588. begin
  2589. case tosize of
  2590. OS_F32:
  2591. begin
  2592. intreg:=getintregister(list,OS_32);
  2593. a_loadmm_reg_intreg(list,OS_F32,OS_32,tmpmmreg,intreg,shuffle);
  2594. a_load_reg_ref(list,OS_32,OS_32,intreg,ref);
  2595. end;
  2596. OS_F64:
  2597. begin
  2598. reg64.reglo:=getintregister(list,OS_32);
  2599. reg64.reghi:=getintregister(list,OS_32);
  2600. cg64.a_loadmm_reg_intreg64(list,OS_F64,tmpmmreg,reg64);
  2601. cg64.a_load64_reg_ref(list,reg64,ref);
  2602. end;
  2603. else
  2604. internalerror(2009112417);
  2605. end;
  2606. end
  2607. else
  2608. begin
  2609. case fromsize of
  2610. OS_F32:
  2611. op:=A_FSTS;
  2612. OS_F64:
  2613. op:=A_FSTD;
  2614. else
  2615. internalerror(2009112418);
  2616. end;
  2617. handle_load_store(list,op,PF_None,tmpmmreg,ref);
  2618. end;
  2619. end;
  2620. procedure tbasecgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  2621. begin
  2622. { this code can only be used to transfer raw data, not to perform
  2623. conversions }
  2624. if (tosize<>OS_F32) then
  2625. internalerror(2009112419);
  2626. if not(fromsize in [OS_32,OS_S32]) then
  2627. internalerror(2009112420);
  2628. if assigned(shuffle) and
  2629. not shufflescalar(shuffle) then
  2630. internalerror(2009112516);
  2631. list.concat(taicpu.op_reg_reg(A_FMSR,mmreg,intreg));
  2632. end;
  2633. procedure tbasecgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize; mmreg, intreg: tregister;shuffle : pmmshuffle);
  2634. begin
  2635. { this code can only be used to transfer raw data, not to perform
  2636. conversions }
  2637. if (fromsize<>OS_F32) then
  2638. internalerror(2009112430);
  2639. if not(tosize in [OS_32,OS_S32]) then
  2640. internalerror(2009112420);
  2641. if assigned(shuffle) and
  2642. not shufflescalar(shuffle) then
  2643. internalerror(2009112514);
  2644. list.concat(taicpu.op_reg_reg(A_FMRS,intreg,mmreg));
  2645. end;
  2646. procedure tbasecgarm.a_opmm_reg_reg(list: tasmlist; op: topcg; size: tcgsize; src, dst: tregister; shuffle: pmmshuffle);
  2647. var
  2648. tmpreg: tregister;
  2649. begin
  2650. { the vfp doesn't support xor nor any other logical operation, but
  2651. this routine is used to initialise global mm regvars. We can
  2652. easily initialise an mm reg with 0 though. }
  2653. case op of
  2654. OP_XOR:
  2655. begin
  2656. if (src<>dst) or
  2657. (reg_cgsize(src)<>size) or
  2658. assigned(shuffle) then
  2659. internalerror(2009112907);
  2660. tmpreg:=getintregister(list,OS_32);
  2661. a_load_const_reg(list,OS_32,0,tmpreg);
  2662. case size of
  2663. OS_F32:
  2664. list.concat(taicpu.op_reg_reg(A_FMSR,dst,tmpreg));
  2665. OS_F64:
  2666. list.concat(taicpu.op_reg_reg_reg(A_FMDRR,dst,tmpreg,tmpreg));
  2667. else
  2668. internalerror(2009112908);
  2669. end;
  2670. end
  2671. else
  2672. internalerror(2009112906);
  2673. end;
  2674. end;
  2675. procedure tbasecgarm.g_intf_wrapper(list: TAsmList; procdef: tprocdef; const labelname: string; ioffset: longint);
  2676. procedure loadvmttor12;
  2677. var
  2678. href : treference;
  2679. begin
  2680. reference_reset_base(href,NR_R0,0,sizeof(pint));
  2681. if current_settings.cputype in cpu_thumb then
  2682. begin
  2683. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R0]));
  2684. cg.a_load_ref_reg(list,OS_ADDR,OS_ADDR,href,NR_R0);
  2685. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_R0));
  2686. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R0]));
  2687. end
  2688. else
  2689. cg.a_load_ref_reg(list,OS_ADDR,OS_ADDR,href,NR_R12);
  2690. end;
  2691. procedure op_onr12methodaddr;
  2692. var
  2693. href : treference;
  2694. begin
  2695. if (procdef.extnumber=$ffff) then
  2696. Internalerror(200006139);
  2697. if current_settings.cputype in cpu_thumb then
  2698. begin
  2699. reference_reset_base(href,NR_R0,tobjectdef(procdef.struct).vmtmethodoffset(procdef.extnumber),sizeof(pint));
  2700. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R0]));
  2701. cg.a_load_ref_reg(list,OS_ADDR,OS_ADDR,href,NR_R0);
  2702. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_R0));
  2703. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R0]));
  2704. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R12));
  2705. end
  2706. else
  2707. begin
  2708. reference_reset_base(href,NR_R12,tobjectdef(procdef.struct).vmtmethodoffset(procdef.extnumber),sizeof(pint));
  2709. cg.a_load_ref_reg(list,OS_ADDR,OS_ADDR,href,NR_R12);
  2710. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R12));
  2711. end;
  2712. end;
  2713. var
  2714. make_global : boolean;
  2715. begin
  2716. if not(procdef.proctypeoption in [potype_function,potype_procedure]) then
  2717. Internalerror(200006137);
  2718. if not assigned(procdef.struct) or
  2719. (procdef.procoptions*[po_classmethod, po_staticmethod,
  2720. po_methodpointer, po_interrupt, po_iocheck]<>[]) then
  2721. Internalerror(200006138);
  2722. if procdef.owner.symtabletype<>ObjectSymtable then
  2723. Internalerror(200109191);
  2724. make_global:=false;
  2725. if (not current_module.is_unit) or
  2726. create_smartlink or
  2727. (procdef.owner.defowner.owner.symtabletype=globalsymtable) then
  2728. make_global:=true;
  2729. if make_global then
  2730. list.concat(Tai_symbol.Createname_global(labelname,AT_FUNCTION,0))
  2731. else
  2732. list.concat(Tai_symbol.Createname(labelname,AT_FUNCTION,0));
  2733. { the wrapper might need aktlocaldata for the additional data to
  2734. load the constant }
  2735. current_procinfo:=cprocinfo.create(nil);
  2736. { set param1 interface to self }
  2737. g_adjust_self_value(list,procdef,ioffset);
  2738. { case 4 }
  2739. if (po_virtualmethod in procdef.procoptions) and
  2740. not is_objectpascal_helper(procdef.struct) then
  2741. begin
  2742. loadvmttor12;
  2743. op_onr12methodaddr;
  2744. end
  2745. { case 0 }
  2746. else
  2747. list.concat(taicpu.op_sym(A_B,current_asmdata.RefAsmSymbol(procdef.mangledname)));
  2748. list.concatlist(current_procinfo.aktlocaldata);
  2749. current_procinfo.Free;
  2750. current_procinfo:=nil;
  2751. list.concat(Tai_symbol_end.Createname(labelname));
  2752. end;
  2753. procedure tbasecgarm.maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  2754. const
  2755. overflowops = [OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NEG];
  2756. begin
  2757. if (op in overflowops) and
  2758. (size in [OS_8,OS_S8,OS_16,OS_S16]) then
  2759. a_load_reg_reg(list,OS_32,size,dst,dst);
  2760. end;
  2761. function tbasecgarm.get_darwin_call_stub(const s: string; weak: boolean): tasmsymbol;
  2762. var
  2763. stubname: string;
  2764. l1: tasmsymbol;
  2765. href: treference;
  2766. begin
  2767. stubname := 'L'+s+'$stub';
  2768. result := current_asmdata.getasmsymbol(stubname);
  2769. if assigned(result) then
  2770. exit;
  2771. if current_asmdata.asmlists[al_imports]=nil then
  2772. current_asmdata.asmlists[al_imports]:=TAsmList.create;
  2773. new_section(current_asmdata.asmlists[al_imports],sec_stub,'',4);
  2774. result := current_asmdata.RefAsmSymbol(stubname);
  2775. current_asmdata.asmlists[al_imports].concat(Tai_symbol.Create(result,0));
  2776. { register as a weak symbol if necessary }
  2777. if weak then
  2778. current_asmdata.weakrefasmsymbol(s);
  2779. current_asmdata.asmlists[al_imports].concat(tai_directive.create(asd_indirect_symbol,s));
  2780. if not(cs_create_pic in current_settings.moduleswitches) then
  2781. begin
  2782. l1 := current_asmdata.RefAsmSymbol('L'+s+'$slp');
  2783. reference_reset_symbol(href,l1,0,sizeof(pint));
  2784. href.refaddr:=addr_full;
  2785. current_asmdata.asmlists[al_imports].concat(taicpu.op_reg_ref(A_LDR,NR_R12,href));
  2786. reference_reset_base(href,NR_R12,0,sizeof(pint));
  2787. current_asmdata.asmlists[al_imports].concat(taicpu.op_reg_ref(A_LDR,NR_R15,href));
  2788. current_asmdata.asmlists[al_imports].concat(Tai_symbol.Create(l1,0));
  2789. l1 := current_asmdata.RefAsmSymbol('L'+s+'$lazy_ptr');
  2790. current_asmdata.asmlists[al_imports].concat(tai_const.create_sym(l1));
  2791. end
  2792. else
  2793. internalerror(2008100401);
  2794. new_section(current_asmdata.asmlists[al_imports],sec_data_lazy,'',sizeof(pint));
  2795. current_asmdata.asmlists[al_imports].concat(Tai_symbol.Create(l1,0));
  2796. current_asmdata.asmlists[al_imports].concat(tai_directive.create(asd_indirect_symbol,s));
  2797. current_asmdata.asmlists[al_imports].concat(tai_const.createname('dyld_stub_binding_helper',0));
  2798. end;
  2799. procedure tcg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  2800. begin
  2801. case op of
  2802. OP_NEG:
  2803. begin
  2804. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2805. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  2806. list.concat(taicpu.op_reg_reg_const(A_RSC,regdst.reghi,regsrc.reghi,0));
  2807. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2808. end;
  2809. OP_NOT:
  2810. begin
  2811. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  2812. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  2813. end;
  2814. else
  2815. a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);
  2816. end;
  2817. end;
  2818. procedure tcg64farm.a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);
  2819. begin
  2820. a_op64_const_reg_reg(list,op,size,value,reg,reg);
  2821. end;
  2822. procedure tcg64farm.a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);
  2823. var
  2824. ovloc : tlocation;
  2825. begin
  2826. a_op64_const_reg_reg_checkoverflow(list,op,size,value,regsrc,regdst,false,ovloc);
  2827. end;
  2828. procedure tcg64farm.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);
  2829. var
  2830. ovloc : tlocation;
  2831. begin
  2832. a_op64_reg_reg_reg_checkoverflow(list,op,size,regsrc1,regsrc2,regdst,false,ovloc);
  2833. end;
  2834. procedure tcg64farm.a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);
  2835. begin
  2836. { this code can only be used to transfer raw data, not to perform
  2837. conversions }
  2838. if (mmsize<>OS_F64) then
  2839. internalerror(2009112405);
  2840. list.concat(taicpu.op_reg_reg_reg(A_FMDRR,mmreg,intreg.reglo,intreg.reghi));
  2841. end;
  2842. procedure tcg64farm.a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);
  2843. begin
  2844. { this code can only be used to transfer raw data, not to perform
  2845. conversions }
  2846. if (mmsize<>OS_F64) then
  2847. internalerror(2009112406);
  2848. list.concat(taicpu.op_reg_reg_reg(A_FMRRD,intreg.reglo,intreg.reghi,mmreg));
  2849. end;
  2850. procedure tcg64farm.a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  2851. var
  2852. tmpreg : tregister;
  2853. b : byte;
  2854. begin
  2855. ovloc.loc:=LOC_VOID;
  2856. case op of
  2857. OP_NEG,
  2858. OP_NOT :
  2859. internalerror(2012022501);
  2860. end;
  2861. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  2862. begin
  2863. case op of
  2864. OP_ADD:
  2865. begin
  2866. if is_shifter_const(lo(value),b) then
  2867. begin
  2868. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2869. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  2870. end
  2871. else
  2872. begin
  2873. tmpreg:=cg.getintregister(list,OS_32);
  2874. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  2875. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2876. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  2877. end;
  2878. if is_shifter_const(hi(value),b) then
  2879. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,hi(value)),PF_S))
  2880. else
  2881. begin
  2882. tmpreg:=cg.getintregister(list,OS_32);
  2883. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  2884. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  2885. end;
  2886. end;
  2887. OP_SUB:
  2888. begin
  2889. if is_shifter_const(lo(value),b) then
  2890. begin
  2891. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2892. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  2893. end
  2894. else
  2895. begin
  2896. tmpreg:=cg.getintregister(list,OS_32);
  2897. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  2898. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2899. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  2900. end;
  2901. if is_shifter_const(hi(value),b) then
  2902. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))),PF_S))
  2903. else
  2904. begin
  2905. tmpreg:=cg.getintregister(list,OS_32);
  2906. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  2907. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  2908. end;
  2909. end;
  2910. else
  2911. internalerror(200502131);
  2912. end;
  2913. if size=OS_64 then
  2914. begin
  2915. { the arm has an weired opinion how flags for SUB/ADD are handled }
  2916. ovloc.loc:=LOC_FLAGS;
  2917. case op of
  2918. OP_ADD:
  2919. ovloc.resflags:=F_CS;
  2920. OP_SUB:
  2921. ovloc.resflags:=F_CC;
  2922. end;
  2923. end;
  2924. end
  2925. else
  2926. begin
  2927. case op of
  2928. OP_AND,OP_OR,OP_XOR:
  2929. begin
  2930. cg.a_op_const_reg_reg(list,op,OS_32,aint(lo(value)),regsrc.reglo,regdst.reglo);
  2931. cg.a_op_const_reg_reg(list,op,OS_32,aint(hi(value)),regsrc.reghi,regdst.reghi);
  2932. end;
  2933. OP_ADD:
  2934. begin
  2935. if is_shifter_const(aint(lo(value)),b) then
  2936. begin
  2937. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2938. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  2939. end
  2940. else
  2941. begin
  2942. tmpreg:=cg.getintregister(list,OS_32);
  2943. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  2944. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2945. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  2946. end;
  2947. if is_shifter_const(aint(hi(value)),b) then
  2948. list.concat(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  2949. else
  2950. begin
  2951. tmpreg:=cg.getintregister(list,OS_32);
  2952. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  2953. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg));
  2954. end;
  2955. end;
  2956. OP_SUB:
  2957. begin
  2958. if is_shifter_const(aint(lo(value)),b) then
  2959. begin
  2960. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2961. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  2962. end
  2963. else
  2964. begin
  2965. tmpreg:=cg.getintregister(list,OS_32);
  2966. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  2967. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2968. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  2969. end;
  2970. if is_shifter_const(aint(hi(value)),b) then
  2971. list.concat(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  2972. else
  2973. begin
  2974. tmpreg:=cg.getintregister(list,OS_32);
  2975. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  2976. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg));
  2977. end;
  2978. end;
  2979. else
  2980. internalerror(2003083101);
  2981. end;
  2982. end;
  2983. end;
  2984. procedure tcg64farm.a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  2985. begin
  2986. ovloc.loc:=LOC_VOID;
  2987. case op of
  2988. OP_NEG,
  2989. OP_NOT :
  2990. internalerror(2012022502);
  2991. end;
  2992. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  2993. begin
  2994. case op of
  2995. OP_ADD:
  2996. begin
  2997. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2998. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  2999. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi),PF_S));
  3000. end;
  3001. OP_SUB:
  3002. begin
  3003. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3004. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3005. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi),PF_S));
  3006. end;
  3007. else
  3008. internalerror(2003083101);
  3009. end;
  3010. if size=OS_64 then
  3011. begin
  3012. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3013. ovloc.loc:=LOC_FLAGS;
  3014. case op of
  3015. OP_ADD:
  3016. ovloc.resflags:=F_CS;
  3017. OP_SUB:
  3018. ovloc.resflags:=F_CC;
  3019. end;
  3020. end;
  3021. end
  3022. else
  3023. begin
  3024. case op of
  3025. OP_AND,OP_OR,OP_XOR:
  3026. begin
  3027. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);
  3028. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);
  3029. end;
  3030. OP_ADD:
  3031. begin
  3032. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3033. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3034. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi));
  3035. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3036. end;
  3037. OP_SUB:
  3038. begin
  3039. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3040. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3041. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi));
  3042. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3043. end;
  3044. else
  3045. internalerror(2003083101);
  3046. end;
  3047. end;
  3048. end;
  3049. procedure tthumbcgarm.init_register_allocators;
  3050. begin
  3051. inherited init_register_allocators;
  3052. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3053. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7],first_int_imreg,[]);
  3054. { rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  3055. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  3056. if current_settings.fputype=fpu_fpv4_s16 then
  3057. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3058. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3059. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3060. ],first_mm_imreg,[])
  3061. else
  3062. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBNONE,
  3063. [RS_S0,RS_S1,RS_R2,RS_R3,RS_R4,RS_S31],first_mm_imreg,[]);
  3064. }
  3065. end;
  3066. procedure tthumbcgarm.done_register_allocators;
  3067. begin
  3068. rg[R_INTREGISTER].free;
  3069. rg[R_FPUREGISTER].free;
  3070. rg[R_MMREGISTER].free;
  3071. inherited done_register_allocators;
  3072. end;
  3073. procedure tthumbcgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  3074. var
  3075. ref : treference;
  3076. shift : byte;
  3077. r : byte;
  3078. regs, saveregs : tcpuregisterset;
  3079. r7offset,
  3080. stackmisalignment : pint;
  3081. postfix: toppostfix;
  3082. imm1, imm2: DWord;
  3083. begin
  3084. LocalSize:=align(LocalSize,4);
  3085. { call instruction does not put anything on the stack }
  3086. stackmisalignment:=0;
  3087. if not(nostackframe) then
  3088. begin
  3089. a_reg_alloc(list,NR_STACK_POINTER_REG);
  3090. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3091. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  3092. { save int registers }
  3093. reference_reset(ref,4);
  3094. ref.index:=NR_STACK_POINTER_REG;
  3095. ref.addressmode:=AM_PREINDEXED;
  3096. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3097. a_reg_alloc(list,NR_STACK_POINTER_REG);
  3098. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3099. begin
  3100. //!!!! a_reg_alloc(list,NR_R12);
  3101. //!!!! list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  3102. end;
  3103. { the (old) ARM APCS requires saving both the stack pointer (to
  3104. crawl the stack) and the PC (to identify the function this
  3105. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  3106. and R15 -- still needs updating for EABI and Darwin, they don't
  3107. need that }
  3108. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3109. regs:=regs+[RS_R7,RS_R14]
  3110. else
  3111. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  3112. include(regs,RS_R14);
  3113. { safely estimate stack size }
  3114. if localsize+current_settings.alignment.localalignmax>508 then
  3115. include(regs,RS_R4);
  3116. if regs<>[] then
  3117. begin
  3118. for r:=RS_R0 to RS_R15 do
  3119. if r in regs then
  3120. inc(stackmisalignment,4);
  3121. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,regs));
  3122. end;
  3123. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3124. begin
  3125. { the framepointer now points to the saved R15, so the saved
  3126. framepointer is at R11-12 (for get_caller_frame) }
  3127. //!!! list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  3128. //!!! a_reg_dealloc(list,NR_R12);
  3129. end;
  3130. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  3131. if (LocalSize<>0) or
  3132. ((stackmisalignment<>0) and
  3133. ((pi_do_call in current_procinfo.flags) or
  3134. (po_assembler in current_procinfo.procdef.procoptions))) then
  3135. begin
  3136. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3137. if localsize<508 then
  3138. begin
  3139. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  3140. end
  3141. else
  3142. begin
  3143. a_load_const_reg(list,OS_ADDR,-localsize,NR_R4);
  3144. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R4));
  3145. //!!!! if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  3146. //!!!! a_reg_alloc(list,NR_R12);
  3147. //!!!! a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  3148. //!!!! list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  3149. //!!!! a_reg_dealloc(list,NR_R12);
  3150. end;
  3151. end;
  3152. end;
  3153. end;
  3154. procedure tthumbcgarm.g_proc_exit(list: TAsmList; parasize: longint; nostackframe: boolean);
  3155. var
  3156. ref : treference;
  3157. LocalSize : longint;
  3158. r,
  3159. shift : byte;
  3160. saveregs,
  3161. regs : tcpuregisterset;
  3162. stackmisalignment: pint;
  3163. imm1, imm2: DWord;
  3164. begin
  3165. if not(nostackframe) then
  3166. begin
  3167. stackmisalignment:=0;
  3168. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall) ;
  3169. include(regs,RS_R15);
  3170. for r:=RS_R0 to RS_R15 do
  3171. if r in regs then
  3172. inc(stackmisalignment,4);
  3173. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  3174. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  3175. (target_info.system in systems_darwin) then
  3176. begin
  3177. LocalSize:=current_procinfo.calc_stackframe_size;
  3178. if (LocalSize<>0) or
  3179. ((stackmisalignment<>0) and
  3180. ((pi_do_call in current_procinfo.flags) or
  3181. (po_assembler in current_procinfo.procdef.procoptions))) then
  3182. begin
  3183. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3184. if is_shifter_const(LocalSize,shift) then
  3185. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  3186. else if split_into_shifter_const(localsize, imm1, imm2) then
  3187. begin
  3188. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  3189. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  3190. end
  3191. else
  3192. begin
  3193. a_reg_alloc(list,NR_R12);
  3194. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  3195. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  3196. a_reg_dealloc(list,NR_R12);
  3197. end;
  3198. end;
  3199. if regs=[] then
  3200. begin
  3201. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3202. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3203. else
  3204. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3205. end
  3206. else
  3207. begin
  3208. reference_reset(ref,4);
  3209. ref.index:=NR_STACK_POINTER_REG;
  3210. ref.addressmode:=AM_PREINDEXED;
  3211. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,regs));
  3212. end;
  3213. end
  3214. else
  3215. begin
  3216. { restore int registers and return }
  3217. reference_reset(ref,4);
  3218. ref.index:=NR_FRAME_POINTER_REG;
  3219. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,regs));
  3220. end;
  3221. end
  3222. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3223. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3224. else
  3225. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3226. end;
  3227. procedure tthumbcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3228. var
  3229. oppostfix:toppostfix;
  3230. usedtmpref: treference;
  3231. tmpreg,tmpreg2 : tregister;
  3232. dir : integer;
  3233. begin
  3234. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3235. FromSize := ToSize;
  3236. case FromSize of
  3237. { signed integer registers }
  3238. OS_8:
  3239. oppostfix:=PF_B;
  3240. OS_S8:
  3241. oppostfix:=PF_SB;
  3242. OS_16:
  3243. oppostfix:=PF_H;
  3244. OS_S16:
  3245. oppostfix:=PF_SH;
  3246. OS_32,
  3247. OS_S32:
  3248. oppostfix:=PF_None;
  3249. else
  3250. InternalError(200308297);
  3251. end;
  3252. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3253. begin
  3254. if target_info.endian=endian_big then
  3255. dir:=-1
  3256. else
  3257. dir:=1;
  3258. case FromSize of
  3259. OS_16,OS_S16:
  3260. begin
  3261. { only complicated references need an extra loadaddr }
  3262. if assigned(ref.symbol) or
  3263. (ref.index<>NR_NO) or
  3264. (ref.offset<-255) or
  3265. (ref.offset>4094) or
  3266. { sometimes the compiler reused registers }
  3267. (reg=ref.index) or
  3268. (reg=ref.base) then
  3269. begin
  3270. tmpreg2:=getintregister(list,OS_INT);
  3271. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3272. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3273. end
  3274. else
  3275. usedtmpref:=ref;
  3276. if target_info.endian=endian_big then
  3277. inc(usedtmpref.offset,1);
  3278. tmpreg:=getintregister(list,OS_INT);
  3279. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3280. inc(usedtmpref.offset,dir);
  3281. if FromSize=OS_16 then
  3282. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3283. else
  3284. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3285. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3286. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3287. end;
  3288. OS_32,OS_S32:
  3289. begin
  3290. tmpreg:=getintregister(list,OS_INT);
  3291. { only complicated references need an extra loadaddr }
  3292. if assigned(ref.symbol) or
  3293. (ref.index<>NR_NO) or
  3294. (ref.offset<-255) or
  3295. (ref.offset>4092) or
  3296. { sometimes the compiler reused registers }
  3297. (reg=ref.index) or
  3298. (reg=ref.base) then
  3299. begin
  3300. tmpreg2:=getintregister(list,OS_INT);
  3301. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3302. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3303. end
  3304. else
  3305. usedtmpref:=ref;
  3306. if ref.alignment=2 then
  3307. begin
  3308. if target_info.endian=endian_big then
  3309. inc(usedtmpref.offset,2);
  3310. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  3311. inc(usedtmpref.offset,dir*2);
  3312. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  3313. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3314. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3315. end
  3316. else
  3317. begin
  3318. if target_info.endian=endian_big then
  3319. inc(usedtmpref.offset,3);
  3320. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3321. inc(usedtmpref.offset,dir);
  3322. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3323. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3324. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3325. inc(usedtmpref.offset,dir);
  3326. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3327. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3328. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3329. inc(usedtmpref.offset,dir);
  3330. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3331. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,24));
  3332. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3333. end;
  3334. end
  3335. else
  3336. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3337. end;
  3338. end
  3339. else
  3340. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3341. if (fromsize=OS_S8) and (tosize = OS_16) then
  3342. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  3343. end;
  3344. procedure tthumbcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3345. var
  3346. imm_shift : byte;
  3347. l : tasmlabel;
  3348. hr : treference;
  3349. begin
  3350. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3351. internalerror(2002090902);
  3352. if is_thumb_imm(a) then
  3353. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3354. else
  3355. begin
  3356. reference_reset(hr,4);
  3357. current_asmdata.getjumplabel(l);
  3358. cg.a_label(current_procinfo.aktlocaldata,l);
  3359. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3360. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3361. hr.symbol:=l;
  3362. hr.base:=NR_PC;
  3363. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3364. end;
  3365. end;
  3366. procedure tthumbcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  3367. var
  3368. tmpreg,overflowreg : tregister;
  3369. asmop : tasmop;
  3370. begin
  3371. case op of
  3372. OP_NEG:
  3373. list.concat(taicpu.op_reg_reg(A_NEG,dst,src));
  3374. OP_NOT:
  3375. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  3376. OP_DIV,OP_IDIV:
  3377. internalerror(200308281);
  3378. OP_ROL:
  3379. begin
  3380. if not(size in [OS_32,OS_S32]) then
  3381. internalerror(2008072801);
  3382. { simulate ROL by ror'ing 32-value }
  3383. tmpreg:=getintregister(list,OS_32);
  3384. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,tmpreg,src,32),PF_S));
  3385. list.concat(taicpu.op_reg_reg(A_ROR,dst,src));
  3386. end;
  3387. else
  3388. begin
  3389. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3390. list.concat(setoppostfix(
  3391. taicpu.op_reg_reg(op_reg_opcg2asmop[op],dst,src),op_reg_postfix[op]));
  3392. end;
  3393. end;
  3394. maybeadjustresult(list,op,size,dst);
  3395. end;
  3396. procedure tthumbcgarm.a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);
  3397. var
  3398. tmpreg : tregister;
  3399. so : tshifterop;
  3400. l1 : longint;
  3401. imm1, imm2: DWord;
  3402. begin
  3403. //!!! ovloc.loc:=LOC_VOID;
  3404. if {$ifopt R+}(a<>-2147483648) and{$endif} {!!!!!! not setflags and } is_thumb_imm(-a) then
  3405. case op of
  3406. OP_ADD:
  3407. begin
  3408. op:=OP_SUB;
  3409. a:=aint(dword(-a));
  3410. end;
  3411. OP_SUB:
  3412. begin
  3413. op:=OP_ADD;
  3414. a:=aint(dword(-a));
  3415. end
  3416. end;
  3417. if is_thumb_imm(a) and not(op in [OP_IMUL,OP_MUL,OP_AND,OP_OR,OP_XOR]) then
  3418. case op of
  3419. OP_NEG:
  3420. list.concat(taicpu.op_reg_const(A_NEG,dst,a));
  3421. OP_NOT:
  3422. list.concat(taicpu.op_reg_const(A_MVN,dst,a));
  3423. OP_ROL:
  3424. begin
  3425. if not(size in [OS_32,OS_S32]) then
  3426. internalerror(2008072801);
  3427. list.concat(taicpu.op_reg_const(A_ROR,dst,a));
  3428. end;
  3429. else
  3430. begin
  3431. // if cgsetflags or setflags then
  3432. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3433. list.concat(setoppostfix(
  3434. taicpu.op_reg_const(op_reg_opcg2asmop[op],dst,a),op_reg_postfix[op]));
  3435. end;
  3436. if (cgsetflags {!!! or setflags }) and (size in [OS_8,OS_16,OS_32]) then
  3437. begin
  3438. //!!! ovloc.loc:=LOC_FLAGS;
  3439. case op of
  3440. OP_ADD:
  3441. //!!! ovloc.resflags:=F_CS;
  3442. ;
  3443. OP_SUB:
  3444. //!!! ovloc.resflags:=F_CC;
  3445. ;
  3446. end;
  3447. end;
  3448. end
  3449. else
  3450. begin
  3451. { there could be added some more sophisticated optimizations }
  3452. if (op in [OP_MUL,OP_IMUL,OP_DIV,OP_IDIV]) and (a=1) then
  3453. a_load_reg_reg(list,size,size,dst,dst)
  3454. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  3455. a_load_const_reg(list,size,0,dst)
  3456. else if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  3457. a_op_reg_reg(list,OP_NEG,size,dst,dst)
  3458. { we do this here instead in the peephole optimizer because
  3459. it saves us a register }
  3460. {$ifdef DUMMY}
  3461. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  3462. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  3463. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  3464. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  3465. begin
  3466. if l1>32 then{roozbeh does this ever happen?}
  3467. internalerror(200308296);
  3468. shifterop_reset(so);
  3469. so.shiftmode:=SM_LSL;
  3470. so.shiftimm:=l1;
  3471. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  3472. end
  3473. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  3474. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  3475. begin
  3476. if l1>32 then{does this ever happen?}
  3477. internalerror(201205181);
  3478. shifterop_reset(so);
  3479. so.shiftmode:=SM_LSL;
  3480. so.shiftimm:=l1;
  3481. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  3482. end
  3483. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  3484. begin
  3485. { nothing to do on success }
  3486. end
  3487. {$endif DUMMY}
  3488. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  3489. Just using mov x, #0 might allow some easier optimizations down the line. }
  3490. else if (op = OP_AND) and (dword(a)=0) then
  3491. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  3492. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  3493. else if (op = OP_AND) and (not(dword(a))=0) then
  3494. // do nothing
  3495. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  3496. broader range of shifterconstants.}
  3497. {$ifdef DUMMY}
  3498. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  3499. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  3500. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  3501. begin
  3502. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,imm1));
  3503. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  3504. end
  3505. else if (op in [OP_ADD, OP_SUB, OP_OR]) and
  3506. not(cgsetflags or setflags) and
  3507. split_into_shifter_const(a, imm1, imm2) then
  3508. begin
  3509. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,imm1));
  3510. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  3511. end
  3512. {$endif DUMMY}
  3513. else
  3514. begin
  3515. tmpreg:=getintregister(list,size);
  3516. a_load_const_reg(list,size,a,tmpreg);
  3517. a_op_reg_reg(list,op,size,tmpreg,dst);
  3518. end;
  3519. end;
  3520. maybeadjustresult(list,op,size,dst);
  3521. end;
  3522. procedure tthumbcgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  3523. var
  3524. l : tasmlabel;
  3525. ai : taicpu;
  3526. begin
  3527. current_asmdata.getjumplabel(l);
  3528. list.concat(taicpu.op_reg_const(A_MOV,reg,1));
  3529. ai:=setcondition(taicpu.op_sym(A_B,l),flags_to_cond(f));
  3530. ai.is_jmp:=true;
  3531. list.concat(ai);
  3532. list.concat(taicpu.op_reg_const(A_MOV,reg,0));
  3533. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3534. cg.a_label(list,l);
  3535. end;
  3536. procedure tthumb2cgarm.init_register_allocators;
  3537. begin
  3538. inherited init_register_allocators;
  3539. { currently, we save R14 always, so we can use it }
  3540. if (target_info.system<>system_arm_darwin) then
  3541. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3542. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3543. RS_R9,RS_R10,RS_R12,RS_R14],first_int_imreg,[])
  3544. else
  3545. { r9 is not available on Darwin according to the llvm code generator }
  3546. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3547. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3548. RS_R10,RS_R12,RS_R14],first_int_imreg,[]);
  3549. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  3550. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  3551. if current_settings.fputype=fpu_fpv4_s16 then
  3552. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3553. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3554. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3555. ],first_mm_imreg,[])
  3556. else
  3557. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBNONE,
  3558. [RS_S0,RS_S1,RS_R2,RS_R3,RS_R4,RS_S31],first_mm_imreg,[]);
  3559. end;
  3560. procedure tthumb2cgarm.done_register_allocators;
  3561. begin
  3562. rg[R_INTREGISTER].free;
  3563. rg[R_FPUREGISTER].free;
  3564. rg[R_MMREGISTER].free;
  3565. inherited done_register_allocators;
  3566. end;
  3567. procedure tthumb2cgarm.a_call_reg(list : TAsmList;reg: tregister);
  3568. begin
  3569. list.concat(taicpu.op_reg(A_BLX, reg));
  3570. {
  3571. the compiler does not properly set this flag anymore in pass 1, and
  3572. for now we only need it after pass 2 (I hope) (JM)
  3573. if not(pi_do_call in current_procinfo.flags) then
  3574. internalerror(2003060703);
  3575. }
  3576. include(current_procinfo.flags,pi_do_call);
  3577. end;
  3578. procedure tthumb2cgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3579. var
  3580. imm_shift : byte;
  3581. l : tasmlabel;
  3582. hr : treference;
  3583. begin
  3584. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3585. internalerror(2002090902);
  3586. if is_thumb32_imm(a) then
  3587. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3588. else if is_thumb32_imm(not(a)) then
  3589. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  3590. else if (a and $FFFF)=a then
  3591. list.concat(taicpu.op_reg_const(A_MOVW,reg,a))
  3592. else
  3593. begin
  3594. reference_reset(hr,4);
  3595. current_asmdata.getjumplabel(l);
  3596. cg.a_label(current_procinfo.aktlocaldata,l);
  3597. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3598. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3599. hr.symbol:=l;
  3600. hr.base:=NR_PC;
  3601. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3602. end;
  3603. end;
  3604. procedure tthumb2cgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3605. var
  3606. oppostfix:toppostfix;
  3607. usedtmpref: treference;
  3608. tmpreg,tmpreg2 : tregister;
  3609. so : tshifterop;
  3610. dir : integer;
  3611. begin
  3612. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3613. FromSize := ToSize;
  3614. case FromSize of
  3615. { signed integer registers }
  3616. OS_8:
  3617. oppostfix:=PF_B;
  3618. OS_S8:
  3619. oppostfix:=PF_SB;
  3620. OS_16:
  3621. oppostfix:=PF_H;
  3622. OS_S16:
  3623. oppostfix:=PF_SH;
  3624. OS_32,
  3625. OS_S32:
  3626. oppostfix:=PF_None;
  3627. else
  3628. InternalError(200308297);
  3629. end;
  3630. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3631. begin
  3632. if target_info.endian=endian_big then
  3633. dir:=-1
  3634. else
  3635. dir:=1;
  3636. case FromSize of
  3637. OS_16,OS_S16:
  3638. begin
  3639. { only complicated references need an extra loadaddr }
  3640. if assigned(ref.symbol) or
  3641. (ref.index<>NR_NO) or
  3642. (ref.offset<-255) or
  3643. (ref.offset>4094) or
  3644. { sometimes the compiler reused registers }
  3645. (reg=ref.index) or
  3646. (reg=ref.base) then
  3647. begin
  3648. tmpreg2:=getintregister(list,OS_INT);
  3649. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3650. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3651. end
  3652. else
  3653. usedtmpref:=ref;
  3654. if target_info.endian=endian_big then
  3655. inc(usedtmpref.offset,1);
  3656. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  3657. tmpreg:=getintregister(list,OS_INT);
  3658. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3659. inc(usedtmpref.offset,dir);
  3660. if FromSize=OS_16 then
  3661. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3662. else
  3663. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3664. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  3665. end;
  3666. OS_32,OS_S32:
  3667. begin
  3668. tmpreg:=getintregister(list,OS_INT);
  3669. { only complicated references need an extra loadaddr }
  3670. if assigned(ref.symbol) or
  3671. (ref.index<>NR_NO) or
  3672. (ref.offset<-255) or
  3673. (ref.offset>4092) or
  3674. { sometimes the compiler reused registers }
  3675. (reg=ref.index) or
  3676. (reg=ref.base) then
  3677. begin
  3678. tmpreg2:=getintregister(list,OS_INT);
  3679. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3680. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3681. end
  3682. else
  3683. usedtmpref:=ref;
  3684. shifterop_reset(so);so.shiftmode:=SM_LSL;
  3685. if ref.alignment=2 then
  3686. begin
  3687. if target_info.endian=endian_big then
  3688. inc(usedtmpref.offset,2);
  3689. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  3690. inc(usedtmpref.offset,dir*2);
  3691. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  3692. so.shiftimm:=16;
  3693. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  3694. end
  3695. else
  3696. begin
  3697. if target_info.endian=endian_big then
  3698. inc(usedtmpref.offset,3);
  3699. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3700. inc(usedtmpref.offset,dir);
  3701. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3702. so.shiftimm:=8;
  3703. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  3704. inc(usedtmpref.offset,dir);
  3705. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3706. so.shiftimm:=16;
  3707. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  3708. inc(usedtmpref.offset,dir);
  3709. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3710. so.shiftimm:=24;
  3711. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  3712. end;
  3713. end
  3714. else
  3715. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3716. end;
  3717. end
  3718. else
  3719. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3720. if (fromsize=OS_S8) and (tosize = OS_16) then
  3721. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  3722. end;
  3723. procedure tthumb2cgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  3724. begin
  3725. if op = OP_NOT then
  3726. begin
  3727. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  3728. case size of
  3729. OS_8: list.concat(taicpu.op_reg_reg(A_UXTB,dst,dst));
  3730. OS_S8: list.concat(taicpu.op_reg_reg(A_SXTB,dst,dst));
  3731. OS_16: list.concat(taicpu.op_reg_reg(A_UXTH,dst,dst));
  3732. OS_S16: list.concat(taicpu.op_reg_reg(A_SXTH,dst,dst));
  3733. end;
  3734. end
  3735. else
  3736. inherited a_op_reg_reg(list, op, size, src, dst);
  3737. end;
  3738. procedure tthumb2cgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  3739. var
  3740. shift, width : byte;
  3741. tmpreg : tregister;
  3742. so : tshifterop;
  3743. l1 : longint;
  3744. begin
  3745. ovloc.loc:=LOC_VOID;
  3746. if {$ifopt R+}(a<>-2147483648) and{$endif} is_shifter_const(-a,shift) then
  3747. case op of
  3748. OP_ADD:
  3749. begin
  3750. op:=OP_SUB;
  3751. a:=aint(dword(-a));
  3752. end;
  3753. OP_SUB:
  3754. begin
  3755. op:=OP_ADD;
  3756. a:=aint(dword(-a));
  3757. end
  3758. end;
  3759. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  3760. case op of
  3761. OP_NEG,OP_NOT,
  3762. OP_DIV,OP_IDIV:
  3763. internalerror(200308281);
  3764. OP_SHL:
  3765. begin
  3766. if a>32 then
  3767. internalerror(200308294);
  3768. if a<>0 then
  3769. begin
  3770. shifterop_reset(so);
  3771. so.shiftmode:=SM_LSL;
  3772. so.shiftimm:=a;
  3773. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  3774. end
  3775. else
  3776. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  3777. end;
  3778. OP_ROL:
  3779. begin
  3780. if a>32 then
  3781. internalerror(200308294);
  3782. if a<>0 then
  3783. begin
  3784. shifterop_reset(so);
  3785. so.shiftmode:=SM_ROR;
  3786. so.shiftimm:=32-a;
  3787. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  3788. end
  3789. else
  3790. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  3791. end;
  3792. OP_ROR:
  3793. begin
  3794. if a>32 then
  3795. internalerror(200308294);
  3796. if a<>0 then
  3797. begin
  3798. shifterop_reset(so);
  3799. so.shiftmode:=SM_ROR;
  3800. so.shiftimm:=a;
  3801. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  3802. end
  3803. else
  3804. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  3805. end;
  3806. OP_SHR:
  3807. begin
  3808. if a>32 then
  3809. internalerror(200308292);
  3810. shifterop_reset(so);
  3811. if a<>0 then
  3812. begin
  3813. so.shiftmode:=SM_LSR;
  3814. so.shiftimm:=a;
  3815. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  3816. end
  3817. else
  3818. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  3819. end;
  3820. OP_SAR:
  3821. begin
  3822. if a>32 then
  3823. internalerror(200308295);
  3824. if a<>0 then
  3825. begin
  3826. shifterop_reset(so);
  3827. so.shiftmode:=SM_ASR;
  3828. so.shiftimm:=a;
  3829. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  3830. end
  3831. else
  3832. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  3833. end;
  3834. else
  3835. if (op in [OP_SUB, OP_ADD]) and
  3836. ((a < 0) or
  3837. (a > 4095)) then
  3838. begin
  3839. tmpreg:=getintregister(list,size);
  3840. a_load_const_reg(list, size, a, tmpreg);
  3841. if cgsetflags or setflags then
  3842. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3843. list.concat(setoppostfix(
  3844. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  3845. end
  3846. else
  3847. begin
  3848. if cgsetflags or setflags then
  3849. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3850. list.concat(setoppostfix(
  3851. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  3852. end;
  3853. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  3854. begin
  3855. ovloc.loc:=LOC_FLAGS;
  3856. case op of
  3857. OP_ADD:
  3858. ovloc.resflags:=F_CS;
  3859. OP_SUB:
  3860. ovloc.resflags:=F_CC;
  3861. end;
  3862. end;
  3863. end
  3864. else
  3865. begin
  3866. { there could be added some more sophisticated optimizations }
  3867. if (op in [OP_MUL,OP_IMUL]) and (a=1) then
  3868. a_load_reg_reg(list,size,size,src,dst)
  3869. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  3870. a_load_const_reg(list,size,0,dst)
  3871. else if (op in [OP_IMUL]) and (a=-1) then
  3872. a_op_reg_reg(list,OP_NEG,size,src,dst)
  3873. { we do this here instead in the peephole optimizer because
  3874. it saves us a register }
  3875. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  3876. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  3877. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  3878. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  3879. begin
  3880. if l1>32 then{roozbeh does this ever happen?}
  3881. internalerror(200308296);
  3882. shifterop_reset(so);
  3883. so.shiftmode:=SM_LSL;
  3884. so.shiftimm:=l1;
  3885. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  3886. end
  3887. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  3888. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  3889. begin
  3890. if l1>32 then{does this ever happen?}
  3891. internalerror(201205181);
  3892. shifterop_reset(so);
  3893. so.shiftmode:=SM_LSL;
  3894. so.shiftimm:=l1;
  3895. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  3896. end
  3897. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  3898. begin
  3899. { nothing to do on success }
  3900. end
  3901. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  3902. Just using mov x, #0 might allow some easier optimizations down the line. }
  3903. else if (op = OP_AND) and (dword(a)=0) then
  3904. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  3905. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  3906. else if (op = OP_AND) and (not(dword(a))=0) then
  3907. list.concat(taicpu.op_reg_reg(A_MOV,dst,src))
  3908. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  3909. broader range of shifterconstants.}
  3910. {else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  3911. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))}
  3912. else if (op = OP_AND) and is_thumb32_imm(a) then
  3913. list.concat(taicpu.op_reg_reg_const(A_MOV,dst,src,dword(a)))
  3914. else if (op = OP_AND) and (a = $FFFF) then
  3915. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  3916. else if (op = OP_AND) and is_thumb32_imm(not(dword(a))) then
  3917. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  3918. else if (op = OP_AND) and is_continuous_mask(not(a), shift, width) then
  3919. begin
  3920. a_load_reg_reg(list,size,size,src,dst);
  3921. list.concat(taicpu.op_reg_const_const(A_BFC,dst,shift,width))
  3922. end
  3923. else
  3924. begin
  3925. tmpreg:=getintregister(list,size);
  3926. a_load_const_reg(list,size,a,tmpreg);
  3927. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  3928. end;
  3929. end;
  3930. maybeadjustresult(list,op,size,dst);
  3931. end;
  3932. const
  3933. op_reg_reg_opcg2asmopThumb2: array[TOpCG] of tasmop =
  3934. (A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NONE,A_MVN,A_ORR,
  3935. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  3936. procedure tthumb2cgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  3937. var
  3938. so : tshifterop;
  3939. tmpreg,overflowreg : tregister;
  3940. asmop : tasmop;
  3941. begin
  3942. ovloc.loc:=LOC_VOID;
  3943. case op of
  3944. OP_NEG,OP_NOT:
  3945. internalerror(200308281);
  3946. OP_ROL:
  3947. begin
  3948. if not(size in [OS_32,OS_S32]) then
  3949. internalerror(2008072801);
  3950. { simulate ROL by ror'ing 32-value }
  3951. tmpreg:=getintregister(list,OS_32);
  3952. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,32));
  3953. list.concat(taicpu.op_reg_reg_reg(A_SUB,src1,tmpreg,src1));
  3954. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  3955. end;
  3956. OP_ROR:
  3957. begin
  3958. if not(size in [OS_32,OS_S32]) then
  3959. internalerror(2008072802);
  3960. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  3961. end;
  3962. OP_IMUL,
  3963. OP_MUL:
  3964. begin
  3965. if cgsetflags or setflags then
  3966. begin
  3967. overflowreg:=getintregister(list,size);
  3968. if op=OP_IMUL then
  3969. asmop:=A_SMULL
  3970. else
  3971. asmop:=A_UMULL;
  3972. { the arm doesn't allow that rd and rm are the same }
  3973. if dst=src2 then
  3974. begin
  3975. if dst<>src1 then
  3976. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  3977. else
  3978. begin
  3979. tmpreg:=getintregister(list,size);
  3980. a_load_reg_reg(list,size,size,src2,dst);
  3981. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  3982. end;
  3983. end
  3984. else
  3985. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  3986. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3987. if op=OP_IMUL then
  3988. begin
  3989. shifterop_reset(so);
  3990. so.shiftmode:=SM_ASR;
  3991. so.shiftimm:=31;
  3992. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  3993. end
  3994. else
  3995. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  3996. ovloc.loc:=LOC_FLAGS;
  3997. ovloc.resflags:=F_NE;
  3998. end
  3999. else
  4000. begin
  4001. { the arm doesn't allow that rd and rm are the same }
  4002. if dst=src2 then
  4003. begin
  4004. if dst<>src1 then
  4005. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  4006. else
  4007. begin
  4008. tmpreg:=getintregister(list,size);
  4009. a_load_reg_reg(list,size,size,src2,dst);
  4010. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  4011. end;
  4012. end
  4013. else
  4014. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  4015. end;
  4016. end;
  4017. else
  4018. begin
  4019. if cgsetflags or setflags then
  4020. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4021. list.concat(setoppostfix(
  4022. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmopThumb2[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4023. end;
  4024. end;
  4025. maybeadjustresult(list,op,size,dst);
  4026. end;
  4027. procedure tthumb2cgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  4028. var item: taicpu;
  4029. begin
  4030. list.concat(taicpu.op_cond(A_ITE, flags_to_cond(f)));
  4031. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  4032. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  4033. end;
  4034. procedure tthumb2cgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  4035. var
  4036. ref : treference;
  4037. shift : byte;
  4038. firstfloatreg,lastfloatreg,
  4039. r : byte;
  4040. regs : tcpuregisterset;
  4041. stackmisalignment: pint;
  4042. begin
  4043. LocalSize:=align(LocalSize,4);
  4044. { call instruction does not put anything on the stack }
  4045. stackmisalignment:=0;
  4046. if not(nostackframe) then
  4047. begin
  4048. firstfloatreg:=RS_NO;
  4049. { save floating point registers? }
  4050. for r:=RS_F0 to RS_F7 do
  4051. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4052. begin
  4053. if firstfloatreg=RS_NO then
  4054. firstfloatreg:=r;
  4055. lastfloatreg:=r;
  4056. inc(stackmisalignment,12);
  4057. end;
  4058. a_reg_alloc(list,NR_STACK_POINTER_REG);
  4059. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4060. begin
  4061. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  4062. a_reg_alloc(list,NR_R12);
  4063. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  4064. end;
  4065. { save int registers }
  4066. reference_reset(ref,4);
  4067. ref.index:=NR_STACK_POINTER_REG;
  4068. ref.addressmode:=AM_PREINDEXED;
  4069. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4070. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4071. regs:=regs+[RS_FRAME_POINTER_REG,RS_R14]
  4072. else if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  4073. include(regs,RS_R14);
  4074. if regs<>[] then
  4075. begin
  4076. for r:=RS_R0 to RS_R15 do
  4077. if (r in regs) then
  4078. inc(stackmisalignment,4);
  4079. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4080. end;
  4081. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4082. begin
  4083. { the framepointer now points to the saved R15, so the saved
  4084. framepointer is at R11-12 (for get_caller_frame) }
  4085. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  4086. a_reg_dealloc(list,NR_R12);
  4087. end;
  4088. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4089. if (LocalSize<>0) or
  4090. ((stackmisalignment<>0) and
  4091. ((pi_do_call in current_procinfo.flags) or
  4092. (po_assembler in current_procinfo.procdef.procoptions))) then
  4093. begin
  4094. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4095. if not(is_shifter_const(localsize,shift)) then
  4096. begin
  4097. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  4098. a_reg_alloc(list,NR_R12);
  4099. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4100. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  4101. a_reg_dealloc(list,NR_R12);
  4102. end
  4103. else
  4104. begin
  4105. a_reg_dealloc(list,NR_R12);
  4106. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  4107. end;
  4108. end;
  4109. if firstfloatreg<>RS_NO then
  4110. begin
  4111. reference_reset(ref,4);
  4112. if tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023 then
  4113. begin
  4114. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  4115. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4116. ref.base:=NR_R12;
  4117. end
  4118. else
  4119. begin
  4120. ref.base:=current_procinfo.framepointer;
  4121. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  4122. end;
  4123. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4124. lastfloatreg-firstfloatreg+1,ref));
  4125. end;
  4126. end;
  4127. end;
  4128. procedure tthumb2cgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  4129. var
  4130. ref : treference;
  4131. firstfloatreg,lastfloatreg,
  4132. r : byte;
  4133. shift : byte;
  4134. regs : tcpuregisterset;
  4135. LocalSize : longint;
  4136. stackmisalignment: pint;
  4137. begin
  4138. if not(nostackframe) then
  4139. begin
  4140. stackmisalignment:=0;
  4141. { restore floating point register }
  4142. firstfloatreg:=RS_NO;
  4143. { save floating point registers? }
  4144. for r:=RS_F0 to RS_F7 do
  4145. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4146. begin
  4147. if firstfloatreg=RS_NO then
  4148. firstfloatreg:=r;
  4149. lastfloatreg:=r;
  4150. { floating point register space is already included in
  4151. localsize below by calc_stackframe_size
  4152. inc(stackmisalignment,12);
  4153. }
  4154. end;
  4155. if firstfloatreg<>RS_NO then
  4156. begin
  4157. reference_reset(ref,4);
  4158. if tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023 then
  4159. begin
  4160. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  4161. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4162. ref.base:=NR_R12;
  4163. end
  4164. else
  4165. begin
  4166. ref.base:=current_procinfo.framepointer;
  4167. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  4168. end;
  4169. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4170. lastfloatreg-firstfloatreg+1,ref));
  4171. end;
  4172. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4173. if (pi_do_call in current_procinfo.flags) or (regs<>[]) then
  4174. begin
  4175. exclude(regs,RS_R14);
  4176. include(regs,RS_R15);
  4177. end;
  4178. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  4179. regs:=regs+[RS_FRAME_POINTER_REG,RS_R15];
  4180. for r:=RS_R0 to RS_R15 do
  4181. if (r in regs) then
  4182. inc(stackmisalignment,4);
  4183. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4184. LocalSize:=current_procinfo.calc_stackframe_size;
  4185. if (LocalSize<>0) or
  4186. ((stackmisalignment<>0) and
  4187. ((pi_do_call in current_procinfo.flags) or
  4188. (po_assembler in current_procinfo.procdef.procoptions))) then
  4189. begin
  4190. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4191. if not(is_shifter_const(LocalSize,shift)) then
  4192. begin
  4193. a_reg_alloc(list,NR_R12);
  4194. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4195. list.concat(taicpu.op_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_R12));
  4196. a_reg_dealloc(list,NR_R12);
  4197. end
  4198. else
  4199. begin
  4200. a_reg_dealloc(list,NR_R12);
  4201. list.concat(taicpu.op_reg_const(A_ADD,NR_STACK_POINTER_REG,LocalSize));
  4202. end;
  4203. end;
  4204. if regs=[] then
  4205. list.concat(taicpu.op_reg_reg(A_MOV,NR_R15,NR_R14))
  4206. else
  4207. begin
  4208. reference_reset(ref,4);
  4209. ref.index:=NR_STACK_POINTER_REG;
  4210. ref.addressmode:=AM_PREINDEXED;
  4211. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4212. end;
  4213. end
  4214. else
  4215. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14));
  4216. end;
  4217. function tthumb2cgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  4218. var
  4219. tmpreg : tregister;
  4220. tmpref : treference;
  4221. l : tasmlabel;
  4222. so: tshifterop;
  4223. begin
  4224. tmpreg:=NR_NO;
  4225. { Be sure to have a base register }
  4226. if (ref.base=NR_NO) then
  4227. begin
  4228. if ref.shiftmode<>SM_None then
  4229. internalerror(200308294);
  4230. ref.base:=ref.index;
  4231. ref.index:=NR_NO;
  4232. end;
  4233. { absolute symbols can't be handled directly, we've to store the symbol reference
  4234. in the text segment and access it pc relative
  4235. For now, we assume that references where base or index equals to PC are already
  4236. relative, all other references are assumed to be absolute and thus they need
  4237. to be handled extra.
  4238. A proper solution would be to change refoptions to a set and store the information
  4239. if the symbol is absolute or relative there.
  4240. }
  4241. if (assigned(ref.symbol) and
  4242. not(is_pc(ref.base)) and
  4243. not(is_pc(ref.index))
  4244. ) or
  4245. { [#xxx] isn't a valid address operand }
  4246. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  4247. //(ref.offset<-4095) or
  4248. (ref.offset<-255) or
  4249. (ref.offset>4095) or
  4250. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  4251. ((ref.offset<-255) or
  4252. (ref.offset>255)
  4253. )
  4254. ) or
  4255. ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) and
  4256. ((ref.offset<-1020) or
  4257. (ref.offset>1020) or
  4258. { the usual pc relative symbol handling assumes possible offsets of +/- 4095 }
  4259. assigned(ref.symbol)
  4260. )
  4261. ) then
  4262. begin
  4263. reference_reset(tmpref,4);
  4264. { load symbol }
  4265. tmpreg:=getintregister(list,OS_INT);
  4266. if assigned(ref.symbol) then
  4267. begin
  4268. current_asmdata.getjumplabel(l);
  4269. cg.a_label(current_procinfo.aktlocaldata,l);
  4270. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  4271. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset));
  4272. { load consts entry }
  4273. tmpref.symbol:=l;
  4274. tmpref.base:=NR_R15;
  4275. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  4276. { in case of LDF/STF, we got rid of the NR_R15 }
  4277. if is_pc(ref.base) then
  4278. ref.base:=NR_NO;
  4279. if is_pc(ref.index) then
  4280. ref.index:=NR_NO;
  4281. end
  4282. else
  4283. a_load_const_reg(list,OS_ADDR,ref.offset,tmpreg);
  4284. if (ref.base<>NR_NO) then
  4285. begin
  4286. if ref.index<>NR_NO then
  4287. begin
  4288. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4289. ref.base:=tmpreg;
  4290. end
  4291. else
  4292. begin
  4293. ref.index:=tmpreg;
  4294. ref.shiftimm:=0;
  4295. ref.signindex:=1;
  4296. ref.shiftmode:=SM_None;
  4297. end;
  4298. end
  4299. else
  4300. ref.base:=tmpreg;
  4301. ref.offset:=0;
  4302. ref.symbol:=nil;
  4303. end;
  4304. if (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  4305. begin
  4306. if tmpreg<>NR_NO then
  4307. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg,tmpreg)
  4308. else
  4309. begin
  4310. tmpreg:=getintregister(list,OS_ADDR);
  4311. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg);
  4312. ref.base:=tmpreg;
  4313. end;
  4314. ref.offset:=0;
  4315. end;
  4316. { Hack? Thumb2 doesn't allow PC indexed addressing modes(although it does in the specification) }
  4317. if (ref.base=NR_R15) and (ref.index<>NR_NO) and (ref.shiftmode <> sm_none) then
  4318. begin
  4319. tmpreg:=getintregister(list,OS_ADDR);
  4320. list.concat(taicpu.op_reg_reg(A_MOV, tmpreg, NR_R15));
  4321. ref.base := tmpreg;
  4322. end;
  4323. { floating point operations have only limited references
  4324. we expect here, that a base is already set }
  4325. if (op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) and (ref.index<>NR_NO) then
  4326. begin
  4327. if ref.shiftmode<>SM_none then
  4328. internalerror(200309121);
  4329. if tmpreg<>NR_NO then
  4330. begin
  4331. if ref.base=tmpreg then
  4332. begin
  4333. if ref.signindex<0 then
  4334. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,tmpreg,ref.index))
  4335. else
  4336. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,tmpreg,ref.index));
  4337. ref.index:=NR_NO;
  4338. end
  4339. else
  4340. begin
  4341. if ref.index<>tmpreg then
  4342. internalerror(200403161);
  4343. if ref.signindex<0 then
  4344. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,ref.base,tmpreg))
  4345. else
  4346. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4347. ref.base:=tmpreg;
  4348. ref.index:=NR_NO;
  4349. end;
  4350. end
  4351. else
  4352. begin
  4353. tmpreg:=getintregister(list,OS_ADDR);
  4354. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,ref.index));
  4355. ref.base:=tmpreg;
  4356. ref.index:=NR_NO;
  4357. end;
  4358. end;
  4359. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  4360. Result := ref;
  4361. end;
  4362. procedure tthumb2cgarm.a_loadmm_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister; shuffle: pmmshuffle);
  4363. var
  4364. instr: taicpu;
  4365. begin
  4366. if (fromsize=OS_F32) and
  4367. (tosize=OS_F32) then
  4368. begin
  4369. instr:=setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32);
  4370. list.Concat(instr);
  4371. add_move_instruction(instr);
  4372. end
  4373. else if (fromsize=OS_F64) and
  4374. (tosize=OS_F64) then
  4375. begin
  4376. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,tregister(longint(reg2)+1),tregister(longint(reg1)+1)), PF_F32));
  4377. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32));
  4378. end
  4379. else if (fromsize=OS_F32) and
  4380. (tosize=OS_F64) then
  4381. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VCVT,reg2,reg1), PF_F32))
  4382. begin
  4383. //list.concat(nil);
  4384. end;
  4385. end;
  4386. procedure tthumb2cgarm.a_loadmm_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  4387. var
  4388. href: treference;
  4389. tmpreg: TRegister;
  4390. so: tshifterop;
  4391. begin
  4392. href:=ref;
  4393. if (href.base<>NR_NO) and
  4394. (href.index<>NR_NO) then
  4395. begin
  4396. tmpreg:=getintregister(list,OS_INT);
  4397. if href.shiftmode<>SM_None then
  4398. begin
  4399. so.rs:=href.index;
  4400. so.shiftimm:=href.shiftimm;
  4401. so.shiftmode:=href.shiftmode;
  4402. list.concat(taicpu.op_reg_reg_shifterop(A_ADD,tmpreg,href.base,so));
  4403. end
  4404. else
  4405. a_op_reg_reg_reg(list,OP_ADD,OS_INT,href.index,href.base,tmpreg);
  4406. reference_reset_base(href,tmpreg,href.offset,0);
  4407. end;
  4408. if assigned(href.symbol) then
  4409. begin
  4410. tmpreg:=getintregister(list,OS_INT);
  4411. a_loadaddr_ref_reg(list,href,tmpreg);
  4412. reference_reset_base(href,tmpreg,0,0);
  4413. end;
  4414. if fromsize=OS_F32 then
  4415. list.Concat(setoppostfix(taicpu.op_reg_ref(A_VLDR,reg,href), PF_F32))
  4416. else
  4417. list.Concat(setoppostfix(taicpu.op_reg_ref(A_VLDR,reg,href), PF_F64));
  4418. end;
  4419. procedure tthumb2cgarm.a_loadmm_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  4420. var
  4421. href: treference;
  4422. so: tshifterop;
  4423. tmpreg: TRegister;
  4424. begin
  4425. href:=ref;
  4426. if (href.base<>NR_NO) and
  4427. (href.index<>NR_NO) then
  4428. begin
  4429. tmpreg:=getintregister(list,OS_INT);
  4430. if href.shiftmode<>SM_None then
  4431. begin
  4432. so.rs:=href.index;
  4433. so.shiftimm:=href.shiftimm;
  4434. so.shiftmode:=href.shiftmode;
  4435. list.concat(taicpu.op_reg_reg_shifterop(A_ADD,tmpreg,href.base,so));
  4436. end
  4437. else
  4438. a_op_reg_reg_reg(list,OP_ADD,OS_INT,href.index,href.base,tmpreg);
  4439. reference_reset_base(href,tmpreg,href.offset,0);
  4440. end;
  4441. if assigned(href.symbol) then
  4442. begin
  4443. tmpreg:=getintregister(list,OS_INT);
  4444. a_loadaddr_ref_reg(list,href,tmpreg);
  4445. reference_reset_base(href,tmpreg,0,0);
  4446. end;
  4447. if fromsize=OS_F32 then
  4448. list.Concat(setoppostfix(taicpu.op_reg_ref(A_VSTR,reg,href), PF_32))
  4449. else
  4450. list.Concat(setoppostfix(taicpu.op_reg_ref(A_VSTR,reg,href), PF_64));
  4451. end;
  4452. procedure tthumb2cgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize: tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  4453. begin
  4454. if //(shuffle=nil) and
  4455. (tosize=OS_F32) then
  4456. list.Concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg))
  4457. else
  4458. internalerror(2012100813);
  4459. end;
  4460. procedure tthumb2cgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize: tcgsize; mmreg, intreg: tregister; shuffle: pmmshuffle);
  4461. begin
  4462. if //(shuffle=nil) and
  4463. (fromsize=OS_F32) then
  4464. list.Concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg))
  4465. else
  4466. internalerror(2012100814);
  4467. end;
  4468. procedure tthumb2cg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  4469. var tmpreg: tregister;
  4470. begin
  4471. case op of
  4472. OP_NEG:
  4473. begin
  4474. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4475. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  4476. tmpreg:=cg.getintregister(list,OS_32);
  4477. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,0));
  4478. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,tmpreg,regsrc.reghi));
  4479. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4480. end;
  4481. else
  4482. inherited a_op64_reg_reg(list, op, size, regsrc, regdst);
  4483. end;
  4484. end;
  4485. procedure tthumbcg64farm.a_op64_reg_reg(list: TAsmList; op: TOpCG; size: tcgsize; regsrc, regdst: tregister64);
  4486. begin
  4487. case op of
  4488. OP_NEG:
  4489. begin
  4490. list.concat(taicpu.op_reg_const(A_MOV,regdst.reglo,0));
  4491. list.concat(taicpu.op_reg_const(A_MOV,regdst.reghi,0));
  4492. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4493. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4494. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4495. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4496. end;
  4497. OP_NOT:
  4498. begin
  4499. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  4500. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  4501. end;
  4502. OP_AND,OP_OR,OP_XOR:
  4503. begin
  4504. cg.a_op_reg_reg(list,op,OS_32,regsrc.reglo,regdst.reglo);
  4505. cg.a_op_reg_reg(list,op,OS_32,regsrc.reghi,regdst.reghi);
  4506. end;
  4507. OP_ADD:
  4508. begin
  4509. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4510. list.concat(taicpu.op_reg_reg(A_ADD,regdst.reglo,regsrc.reglo));
  4511. list.concat(taicpu.op_reg_reg(A_ADC,regdst.reghi,regsrc.reghi));
  4512. end;
  4513. OP_SUB:
  4514. begin
  4515. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4516. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4517. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4518. end;
  4519. else
  4520. internalerror(2003083101);
  4521. end;
  4522. end;
  4523. procedure tthumbcg64farm.a_op64_const_reg(list: TAsmList; op: TOpCG; size: tcgsize; value: int64; reg: tregister64);
  4524. var
  4525. tmpreg : tregister;
  4526. b : byte;
  4527. begin
  4528. case op of
  4529. OP_AND,OP_OR,OP_XOR:
  4530. begin
  4531. cg.a_op_const_reg(list,op,OS_32,aint(lo(value)),reg.reglo);
  4532. cg.a_op_const_reg(list,op,OS_32,aint(hi(value)),reg.reghi);
  4533. end;
  4534. OP_ADD:
  4535. begin
  4536. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4537. begin
  4538. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4539. list.concat(taicpu.op_reg_const(A_ADD,reg.reglo,aint(lo(value))));
  4540. end
  4541. else
  4542. begin
  4543. tmpreg:=cg.getintregister(list,OS_32);
  4544. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4545. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4546. list.concat(taicpu.op_reg_reg(A_ADD,reg.reglo,tmpreg));
  4547. end;
  4548. tmpreg:=cg.getintregister(list,OS_32);
  4549. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  4550. list.concat(taicpu.op_reg_reg(A_ADC,reg.reghi,tmpreg));
  4551. end;
  4552. OP_SUB:
  4553. begin
  4554. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4555. begin
  4556. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4557. list.concat(taicpu.op_reg_const(A_SUB,reg.reglo,aint(lo(value))))
  4558. end
  4559. else
  4560. begin
  4561. tmpreg:=cg.getintregister(list,OS_32);
  4562. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4563. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4564. list.concat(taicpu.op_reg_reg(A_SUB,reg.reglo,tmpreg));
  4565. end;
  4566. tmpreg:=cg.getintregister(list,OS_32);
  4567. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  4568. list.concat(taicpu.op_reg_reg(A_SBC,reg.reghi,tmpreg));
  4569. end;
  4570. else
  4571. internalerror(2003083101);
  4572. end;
  4573. end;
  4574. procedure create_codegen;
  4575. begin
  4576. if current_settings.cputype in cpu_thumb2 then
  4577. begin
  4578. cg:=tthumb2cgarm.create;
  4579. cg64:=tthumb2cg64farm.create;
  4580. casmoptimizer:=TCpuThumb2AsmOptimizer;
  4581. end
  4582. else if current_settings.cputype in cpu_thumb then
  4583. begin
  4584. cg:=tthumbcgarm.create;
  4585. cg64:=tthumbcg64farm.create;
  4586. // casmoptimizer:=TCpuThumbAsmOptimizer;
  4587. end
  4588. else
  4589. begin
  4590. cg:=tarmcgarm.create;
  4591. cg64:=tarmcg64farm.create;
  4592. casmoptimizer:=TCpuAsmOptimizer;
  4593. end;
  4594. end;
  4595. end.