cgcpu.pas 212 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762277227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382238323842385238623872388238923902391239223932394239523962397239823992400240124022403240424052406240724082409241024112412241324142415241624172418241924202421242224232424242524262427242824292430243124322433243424352436243724382439244024412442244324442445244624472448244924502451245224532454245524562457245824592460246124622463246424652466246724682469247024712472247324742475247624772478247924802481248224832484248524862487248824892490249124922493249424952496249724982499250025012502250325042505250625072508250925102511251225132514251525162517251825192520252125222523252425252526252725282529253025312532253325342535253625372538253925402541254225432544254525462547254825492550255125522553255425552556255725582559256025612562256325642565256625672568256925702571257225732574257525762577257825792580258125822583258425852586258725882589259025912592259325942595259625972598259926002601260226032604260526062607260826092610261126122613261426152616261726182619262026212622262326242625262626272628262926302631263226332634263526362637263826392640264126422643264426452646264726482649265026512652265326542655265626572658265926602661266226632664266526662667266826692670267126722673267426752676267726782679268026812682268326842685268626872688268926902691269226932694269526962697269826992700270127022703270427052706270727082709271027112712271327142715271627172718271927202721272227232724272527262727272827292730273127322733273427352736273727382739274027412742274327442745274627472748274927502751275227532754275527562757275827592760276127622763276427652766276727682769277027712772277327742775277627772778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327732783279328032813282328332843285328632873288328932903291329232933294329532963297329832993300330133023303330433053306330733083309331033113312331333143315331633173318331933203321332233233324332533263327332833293330333133323333333433353336333733383339334033413342334333443345334633473348334933503351335233533354335533563357335833593360336133623363336433653366336733683369337033713372337333743375337633773378337933803381338233833384338533863387338833893390339133923393339433953396339733983399340034013402340334043405340634073408340934103411341234133414341534163417341834193420342134223423342434253426342734283429343034313432343334343435343634373438343934403441344234433444344534463447344834493450345134523453345434553456345734583459346034613462346334643465346634673468346934703471347234733474347534763477347834793480348134823483348434853486348734883489349034913492349334943495349634973498349935003501350235033504350535063507350835093510351135123513351435153516351735183519352035213522352335243525352635273528352935303531353235333534353535363537353835393540354135423543354435453546354735483549355035513552355335543555355635573558355935603561356235633564356535663567356835693570357135723573357435753576357735783579358035813582358335843585358635873588358935903591359235933594359535963597359835993600360136023603360436053606360736083609361036113612361336143615361636173618361936203621362236233624362536263627362836293630363136323633363436353636363736383639364036413642364336443645364636473648364936503651365236533654365536563657365836593660366136623663366436653666366736683669367036713672367336743675367636773678367936803681368236833684368536863687368836893690369136923693369436953696369736983699370037013702370337043705370637073708370937103711371237133714371537163717371837193720372137223723372437253726372737283729373037313732373337343735373637373738373937403741374237433744374537463747374837493750375137523753375437553756375737583759376037613762376337643765376637673768376937703771377237733774377537763777377837793780378137823783378437853786378737883789379037913792379337943795379637973798379938003801380238033804380538063807380838093810381138123813381438153816381738183819382038213822382338243825382638273828382938303831383238333834383538363837383838393840384138423843384438453846384738483849385038513852385338543855385638573858385938603861386238633864386538663867386838693870387138723873387438753876387738783879388038813882388338843885388638873888388938903891389238933894389538963897389838993900390139023903390439053906390739083909391039113912391339143915391639173918391939203921392239233924392539263927392839293930393139323933393439353936393739383939394039413942394339443945394639473948394939503951395239533954395539563957395839593960396139623963396439653966396739683969397039713972397339743975397639773978397939803981398239833984398539863987398839893990399139923993399439953996399739983999400040014002400340044005400640074008400940104011401240134014401540164017401840194020402140224023402440254026402740284029403040314032403340344035403640374038403940404041404240434044404540464047404840494050405140524053405440554056405740584059406040614062406340644065406640674068406940704071407240734074407540764077407840794080408140824083408440854086408740884089409040914092409340944095409640974098409941004101410241034104410541064107410841094110411141124113411441154116411741184119412041214122412341244125412641274128412941304131413241334134413541364137413841394140414141424143414441454146414741484149415041514152415341544155415641574158415941604161416241634164416541664167416841694170417141724173417441754176417741784179418041814182418341844185418641874188418941904191419241934194419541964197419841994200420142024203420442054206420742084209421042114212421342144215421642174218421942204221422242234224422542264227422842294230423142324233423442354236423742384239424042414242424342444245424642474248424942504251425242534254425542564257425842594260426142624263426442654266426742684269427042714272427342744275427642774278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477747784779478047814782478347844785478647874788478947904791479247934794479547964797479847994800480148024803480448054806480748084809481048114812481348144815481648174818481948204821482248234824482548264827482848294830483148324833483448354836483748384839484048414842484348444845484648474848484948504851485248534854485548564857485848594860486148624863486448654866486748684869487048714872487348744875487648774878487948804881488248834884488548864887488848894890489148924893489448954896489748984899490049014902490349044905490649074908490949104911491249134914491549164917491849194920492149224923492449254926492749284929493049314932493349344935493649374938493949404941494249434944494549464947494849494950495149524953495449554956495749584959496049614962496349644965496649674968496949704971497249734974497549764977497849794980498149824983498449854986498749884989499049914992499349944995499649974998499950005001500250035004500550065007500850095010501150125013501450155016501750185019502050215022502350245025502650275028502950305031503250335034503550365037503850395040504150425043504450455046504750485049505050515052505350545055505650575058505950605061506250635064506550665067506850695070507150725073507450755076507750785079508050815082508350845085508650875088508950905091509250935094509550965097509850995100510151025103510451055106510751085109511051115112511351145115511651175118511951205121512251235124512551265127512851295130513151325133513451355136513751385139514051415142514351445145514651475148514951505151515251535154515551565157515851595160516151625163516451655166516751685169517051715172517351745175517651775178517951805181518251835184518551865187518851895190519151925193519451955196519751985199520052015202520352045205520652075208520952105211521252135214521552165217521852195220522152225223522452255226522752285229523052315232523352345235523652375238523952405241524252435244524552465247524852495250525152525253525452555256525752585259526052615262526352645265526652675268526952705271527252735274527552765277527852795280528152825283528452855286528752885289529052915292529352945295529652975298529953005301530253035304530553065307530853095310
  1. {
  2. Copyright (c) 2003 by Florian Klaempfl
  3. Member of the Free Pascal development team
  4. This unit implements the code generator for the ARM
  5. This program is free software; you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation; either version 2 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program; if not, write to the Free Software
  15. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  16. ****************************************************************************
  17. }
  18. unit cgcpu;
  19. {$i fpcdefs.inc}
  20. interface
  21. uses
  22. globtype,symtype,symdef,
  23. cgbase,cgutils,cgobj,
  24. aasmbase,aasmcpu,aasmtai,aasmdata,
  25. parabase,
  26. cpubase,cpuinfo,cg64f32,rgcpu;
  27. type
  28. { tbasecgarm is shared between all arm architectures }
  29. tbasecgarm = class(tcg)
  30. { true, if the next arithmetic operation should modify the flags }
  31. cgsetflags : boolean;
  32. procedure a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);override;
  33. procedure a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);override;
  34. procedure a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);override;
  35. procedure a_call_name(list : TAsmList;const s : string; weak: boolean);override;
  36. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  37. { move instructions }
  38. procedure a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);override;
  39. procedure a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);override;
  40. function a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  41. function a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  42. { fpu move instructions }
  43. procedure a_loadfpu_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister); override;
  44. procedure a_loadfpu_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister); override;
  45. procedure a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference); override;
  46. procedure a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);override;
  47. { comparison operations }
  48. procedure a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  49. l : tasmlabel);override;
  50. procedure a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel); override;
  51. procedure a_jmp_name(list : TAsmList;const s : string); override;
  52. procedure a_jmp_always(list : TAsmList;l: tasmlabel); override;
  53. procedure a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel); override;
  54. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  55. procedure g_profilecode(list : TAsmList); override;
  56. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  57. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  58. procedure g_maybe_got_init(list : TAsmList); override;
  59. procedure a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);override;
  60. procedure g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);override;
  61. procedure g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);override;
  62. procedure g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  63. procedure g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  64. procedure g_overflowcheck(list: TAsmList; const l: tlocation; def: tdef); override;
  65. procedure g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);override;
  66. procedure g_save_registers(list : TAsmList);override;
  67. procedure g_restore_registers(list : TAsmList);override;
  68. procedure a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  69. procedure fixref(list : TAsmList;var ref : treference);
  70. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; virtual;
  71. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  72. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  73. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  74. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  75. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  76. procedure a_opmm_reg_reg(list: TAsmList; Op: TOpCG; size : tcgsize;src,dst: tregister;shuffle : pmmshuffle); override;
  77. { Transform unsupported methods into Internal errors }
  78. procedure a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister); override;
  79. { try to generate optimized 32 Bit multiplication, returns true if successful generated }
  80. function try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  81. { clear out potential overflow bits from 8 or 16 bit operations }
  82. { the upper 24/16 bits of a register after an operation }
  83. procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  84. { mla for thumb requires that none of the registers is equal to r13/r15, this method ensures this }
  85. procedure safe_mla(list: TAsmList;op1,op2,op3,op4 : TRegister);
  86. end;
  87. { tcgarm is shared between normal arm and thumb-2 }
  88. tcgarm = class(tbasecgarm)
  89. procedure a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister); override;
  90. procedure a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference); override;
  91. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  92. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  93. size: tcgsize; a: tcgint; src, dst: tregister); override;
  94. procedure a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  95. size: tcgsize; src1, src2, dst: tregister); override;
  96. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  97. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  98. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  99. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  100. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  101. {Multiply two 32-bit registers into lo and hi 32-bit registers}
  102. procedure a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister); override;
  103. end;
  104. { normal arm cg }
  105. tarmcgarm = class(tcgarm)
  106. procedure init_register_allocators;override;
  107. procedure done_register_allocators;override;
  108. end;
  109. { 64 bit cg for all arm flavours }
  110. tbasecg64farm = class(tcg64f32)
  111. end;
  112. { tcg64farm is shared between normal arm and thumb-2 }
  113. tcg64farm = class(tbasecg64farm)
  114. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  115. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  116. procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;
  117. procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
  118. procedure a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  119. procedure a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  120. procedure a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);override;
  121. procedure a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);override;
  122. end;
  123. tarmcg64farm = class(tcg64farm)
  124. end;
  125. tthumbcgarm = class(tbasecgarm)
  126. procedure init_register_allocators;override;
  127. procedure done_register_allocators;override;
  128. procedure g_proc_entry(list: TAsmList; localsize: longint; nostackframe: boolean);override;
  129. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  130. procedure a_op_reg_reg(list: TAsmList; Op: TOpCG; size: TCGSize; src,dst: TRegister);override;
  131. procedure a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);override;
  132. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister); override;
  133. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  134. procedure a_load_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const Ref: treference; reg: tregister);override;
  135. procedure a_load_const_reg(list: TAsmList; size: tcgsize; a: tcgint; reg: tregister);override;
  136. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  137. function handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference; override;
  138. end;
  139. tthumbcg64farm = class(tbasecg64farm)
  140. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  141. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  142. end;
  143. tthumb2cgarm = class(tcgarm)
  144. procedure init_register_allocators;override;
  145. procedure done_register_allocators;override;
  146. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  147. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  148. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  149. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  150. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  151. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  152. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  153. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  154. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  155. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; override;
  156. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  157. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  158. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  159. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  160. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  161. end;
  162. tthumb2cg64farm = class(tcg64farm)
  163. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  164. end;
  165. const
  166. OpCmp2AsmCond : Array[topcmp] of TAsmCond = (C_NONE,C_EQ,C_GT,
  167. C_LT,C_GE,C_LE,C_NE,C_LS,C_CC,C_CS,C_HI);
  168. winstackpagesize = 4096;
  169. function get_fpu_postfix(def : tdef) : toppostfix;
  170. procedure create_codegen;
  171. implementation
  172. uses
  173. globals,verbose,systems,cutils,
  174. aopt,aoptcpu,
  175. fmodule,
  176. symconst,symsym,symtable,
  177. tgobj,
  178. procinfo,cpupi,
  179. paramgr;
  180. function get_fpu_postfix(def : tdef) : toppostfix;
  181. begin
  182. if def.typ=floatdef then
  183. begin
  184. case tfloatdef(def).floattype of
  185. s32real:
  186. result:=PF_S;
  187. s64real:
  188. result:=PF_D;
  189. s80real:
  190. result:=PF_E;
  191. else
  192. internalerror(200401272);
  193. end;
  194. end
  195. else
  196. internalerror(200401271);
  197. end;
  198. procedure tarmcgarm.init_register_allocators;
  199. begin
  200. inherited init_register_allocators;
  201. { currently, we always save R14, so we can use it }
  202. if (target_info.system<>system_arm_darwin) then
  203. begin
  204. if assigned(current_procinfo) and (current_procinfo.framepointer<>NR_R11) then
  205. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  206. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  207. RS_R9,RS_R10,RS_R11,RS_R14],first_int_imreg,[])
  208. else
  209. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  210. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  211. RS_R9,RS_R10,RS_R14],first_int_imreg,[])
  212. end
  213. else
  214. { r7 is not available on Darwin, it's used as frame pointer (always,
  215. for backtrace support -- also in gcc/clang -> R11 can be used).
  216. r9 is volatile }
  217. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  218. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R9,RS_R12,RS_R4,RS_R5,RS_R6,RS_R8,
  219. RS_R10,RS_R11,RS_R14],first_int_imreg,[]);
  220. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  221. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  222. { The register allocator currently cannot deal with multiple
  223. non-overlapping subregs per register, so we can only use
  224. half the single precision registers for now (as sub registers of the
  225. double precision ones). }
  226. if current_settings.fputype=fpu_vfpv3 then
  227. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  228. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  229. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  230. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  231. ],first_mm_imreg,[])
  232. else
  233. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  234. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15],first_mm_imreg,[]);
  235. end;
  236. procedure tarmcgarm.done_register_allocators;
  237. begin
  238. rg[R_INTREGISTER].free;
  239. rg[R_FPUREGISTER].free;
  240. rg[R_MMREGISTER].free;
  241. inherited done_register_allocators;
  242. end;
  243. procedure tcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  244. var
  245. imm_shift : byte;
  246. l : tasmlabel;
  247. hr : treference;
  248. imm1, imm2: DWord;
  249. begin
  250. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  251. internalerror(2002090902);
  252. if is_shifter_const(a,imm_shift) then
  253. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  254. else if is_shifter_const(not(a),imm_shift) then
  255. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  256. { loading of constants with mov and orr }
  257. else if (split_into_shifter_const(a,imm1, imm2)) then
  258. begin
  259. list.concat(taicpu.op_reg_const(A_MOV,reg, imm1));
  260. list.concat(taicpu.op_reg_reg_const(A_ORR,reg,reg, imm2));
  261. end
  262. { loading of constants with mvn and bic }
  263. else if (split_into_shifter_const(not(a), imm1, imm2)) then
  264. begin
  265. list.concat(taicpu.op_reg_const(A_MVN,reg, imm1));
  266. list.concat(taicpu.op_reg_reg_const(A_BIC,reg,reg, imm2));
  267. end
  268. else
  269. begin
  270. reference_reset(hr,4);
  271. current_asmdata.getjumplabel(l);
  272. cg.a_label(current_procinfo.aktlocaldata,l);
  273. hr.symboldata:=current_procinfo.aktlocaldata.last;
  274. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  275. hr.symbol:=l;
  276. hr.base:=NR_PC;
  277. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  278. end;
  279. end;
  280. procedure tcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  281. var
  282. oppostfix:toppostfix;
  283. usedtmpref: treference;
  284. tmpreg,tmpreg2 : tregister;
  285. so : tshifterop;
  286. dir : integer;
  287. begin
  288. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  289. FromSize := ToSize;
  290. case FromSize of
  291. { signed integer registers }
  292. OS_8:
  293. oppostfix:=PF_B;
  294. OS_S8:
  295. oppostfix:=PF_SB;
  296. OS_16:
  297. oppostfix:=PF_H;
  298. OS_S16:
  299. oppostfix:=PF_SH;
  300. OS_32,
  301. OS_S32:
  302. oppostfix:=PF_None;
  303. else
  304. InternalError(200308297);
  305. end;
  306. if (fromsize=OS_S8) and
  307. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  308. oppostfix:=PF_B;
  309. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize])) or
  310. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  311. (oppostfix in [PF_SH,PF_H])) then
  312. begin
  313. if target_info.endian=endian_big then
  314. dir:=-1
  315. else
  316. dir:=1;
  317. case FromSize of
  318. OS_16,OS_S16:
  319. begin
  320. { only complicated references need an extra loadaddr }
  321. if assigned(ref.symbol) or
  322. (ref.index<>NR_NO) or
  323. (ref.offset<-4095) or
  324. (ref.offset>4094) or
  325. { sometimes the compiler reused registers }
  326. (reg=ref.index) or
  327. (reg=ref.base) then
  328. begin
  329. tmpreg2:=getintregister(list,OS_INT);
  330. a_loadaddr_ref_reg(list,ref,tmpreg2);
  331. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  332. end
  333. else
  334. usedtmpref:=ref;
  335. if target_info.endian=endian_big then
  336. inc(usedtmpref.offset,1);
  337. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  338. tmpreg:=getintregister(list,OS_INT);
  339. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  340. inc(usedtmpref.offset,dir);
  341. if FromSize=OS_16 then
  342. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  343. else
  344. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  345. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  346. end;
  347. OS_32,OS_S32:
  348. begin
  349. tmpreg:=getintregister(list,OS_INT);
  350. { only complicated references need an extra loadaddr }
  351. if assigned(ref.symbol) or
  352. (ref.index<>NR_NO) or
  353. (ref.offset<-4095) or
  354. (ref.offset>4092) or
  355. { sometimes the compiler reused registers }
  356. (reg=ref.index) or
  357. (reg=ref.base) then
  358. begin
  359. tmpreg2:=getintregister(list,OS_INT);
  360. a_loadaddr_ref_reg(list,ref,tmpreg2);
  361. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  362. end
  363. else
  364. usedtmpref:=ref;
  365. shifterop_reset(so);so.shiftmode:=SM_LSL;
  366. if ref.alignment=2 then
  367. begin
  368. if target_info.endian=endian_big then
  369. inc(usedtmpref.offset,2);
  370. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  371. inc(usedtmpref.offset,dir*2);
  372. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  373. so.shiftimm:=16;
  374. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  375. end
  376. else
  377. begin
  378. tmpreg2:=getintregister(list,OS_INT);
  379. if target_info.endian=endian_big then
  380. inc(usedtmpref.offset,3);
  381. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  382. inc(usedtmpref.offset,dir);
  383. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  384. inc(usedtmpref.offset,dir);
  385. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg2);
  386. so.shiftimm:=8;
  387. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  388. inc(usedtmpref.offset,dir);
  389. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  390. so.shiftimm:=16;
  391. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg2,so));
  392. so.shiftimm:=24;
  393. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  394. end;
  395. end
  396. else
  397. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  398. end;
  399. end
  400. else
  401. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  402. if (fromsize=OS_S8) and
  403. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  404. a_load_reg_reg(list,OS_S8,OS_32,reg,reg)
  405. else if (fromsize=OS_S8) and (tosize = OS_16) then
  406. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  407. end;
  408. procedure tcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  409. var
  410. hsym : tsym;
  411. href : treference;
  412. paraloc : Pcgparalocation;
  413. shift : byte;
  414. begin
  415. { calculate the parameter info for the procdef }
  416. procdef.init_paraloc_info(callerside);
  417. hsym:=tsym(procdef.parast.Find('self'));
  418. if not(assigned(hsym) and
  419. (hsym.typ=paravarsym)) then
  420. internalerror(200305251);
  421. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  422. while paraloc<>nil do
  423. with paraloc^ do
  424. begin
  425. case loc of
  426. LOC_REGISTER:
  427. begin
  428. if is_shifter_const(ioffset,shift) then
  429. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  430. else
  431. begin
  432. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  433. a_op_reg_reg(list,OP_SUB,size,NR_R12,register);
  434. end;
  435. end;
  436. LOC_REFERENCE:
  437. begin
  438. { offset in the wrapper needs to be adjusted for the stored
  439. return address }
  440. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),sizeof(pint));
  441. if is_shifter_const(ioffset,shift) then
  442. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  443. else
  444. begin
  445. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  446. a_op_reg_ref(list,OP_SUB,size,NR_R12,href);
  447. end;
  448. end
  449. else
  450. internalerror(200309189);
  451. end;
  452. paraloc:=next;
  453. end;
  454. end;
  455. procedure tbasecgarm.a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);
  456. var
  457. ref: treference;
  458. begin
  459. paraloc.check_simple_location;
  460. paramanager.allocparaloc(list,paraloc.location);
  461. case paraloc.location^.loc of
  462. LOC_REGISTER,LOC_CREGISTER:
  463. a_load_const_reg(list,size,a,paraloc.location^.register);
  464. LOC_REFERENCE:
  465. begin
  466. reference_reset(ref,paraloc.alignment);
  467. ref.base:=paraloc.location^.reference.index;
  468. ref.offset:=paraloc.location^.reference.offset;
  469. a_load_const_ref(list,size,a,ref);
  470. end;
  471. else
  472. internalerror(2002081101);
  473. end;
  474. end;
  475. procedure tbasecgarm.a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);
  476. var
  477. tmpref, ref: treference;
  478. location: pcgparalocation;
  479. sizeleft: aint;
  480. begin
  481. location := paraloc.location;
  482. tmpref := r;
  483. sizeleft := paraloc.intsize;
  484. while assigned(location) do
  485. begin
  486. paramanager.allocparaloc(list,location);
  487. case location^.loc of
  488. LOC_REGISTER,LOC_CREGISTER:
  489. a_load_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  490. LOC_REFERENCE:
  491. begin
  492. reference_reset_base(ref,location^.reference.index,location^.reference.offset,paraloc.alignment);
  493. { doubles in softemu mode have a strange order of registers and references }
  494. if location^.size=OS_32 then
  495. g_concatcopy(list,tmpref,ref,4)
  496. else
  497. begin
  498. g_concatcopy(list,tmpref,ref,sizeleft);
  499. if assigned(location^.next) then
  500. internalerror(2005010710);
  501. end;
  502. end;
  503. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  504. case location^.size of
  505. OS_F32, OS_F64:
  506. a_loadfpu_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  507. else
  508. internalerror(2002072801);
  509. end;
  510. LOC_VOID:
  511. begin
  512. // nothing to do
  513. end;
  514. else
  515. internalerror(2002081103);
  516. end;
  517. inc(tmpref.offset,tcgsize2size[location^.size]);
  518. dec(sizeleft,tcgsize2size[location^.size]);
  519. location := location^.next;
  520. end;
  521. end;
  522. procedure tbasecgarm.a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);
  523. var
  524. ref: treference;
  525. tmpreg: tregister;
  526. begin
  527. paraloc.check_simple_location;
  528. paramanager.allocparaloc(list,paraloc.location);
  529. case paraloc.location^.loc of
  530. LOC_REGISTER,LOC_CREGISTER:
  531. a_loadaddr_ref_reg(list,r,paraloc.location^.register);
  532. LOC_REFERENCE:
  533. begin
  534. reference_reset(ref,paraloc.alignment);
  535. ref.base := paraloc.location^.reference.index;
  536. ref.offset := paraloc.location^.reference.offset;
  537. tmpreg := getintregister(list,OS_ADDR);
  538. a_loadaddr_ref_reg(list,r,tmpreg);
  539. a_load_reg_ref(list,OS_ADDR,OS_ADDR,tmpreg,ref);
  540. end;
  541. else
  542. internalerror(2002080701);
  543. end;
  544. end;
  545. procedure tbasecgarm.a_call_name(list : TAsmList;const s : string; weak: boolean);
  546. var
  547. branchopcode: tasmop;
  548. r : treference;
  549. sym : TAsmSymbol;
  550. begin
  551. { check not really correct: should only be used for non-Thumb cpus }
  552. if (CPUARM_HAS_BLX_LABEL in cpu_capabilities[current_settings.cputype]) and
  553. { WinCE GNU AS (not sure if this applies in general) does not support BLX imm }
  554. (target_info.system<>system_arm_wince) then
  555. branchopcode:=A_BLX
  556. else
  557. branchopcode:=A_BL;
  558. if not(weak) then
  559. sym:=current_asmdata.RefAsmSymbol(s)
  560. else
  561. sym:=current_asmdata.WeakRefAsmSymbol(s);
  562. reference_reset_symbol(r,sym,0,sizeof(pint));
  563. if (tf_pic_uses_got in target_info.flags) and
  564. (cs_create_pic in current_settings.moduleswitches) then
  565. begin
  566. include(current_procinfo.flags,pi_needs_got);
  567. r.refaddr:=addr_pic
  568. end
  569. else
  570. r.refaddr:=addr_full;
  571. list.concat(taicpu.op_ref(branchopcode,r));
  572. {
  573. the compiler does not properly set this flag anymore in pass 1, and
  574. for now we only need it after pass 2 (I hope) (JM)
  575. if not(pi_do_call in current_procinfo.flags) then
  576. internalerror(2003060703);
  577. }
  578. include(current_procinfo.flags,pi_do_call);
  579. end;
  580. procedure tbasecgarm.a_call_reg(list : TAsmList;reg: tregister);
  581. begin
  582. { check not really correct: should only be used for non-Thumb cpus }
  583. if not(CPUARM_HAS_BLX in cpu_capabilities[current_settings.cputype]) then
  584. begin
  585. list.concat(taicpu.op_reg_reg(A_MOV,NR_R14,NR_PC));
  586. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,reg));
  587. end
  588. else
  589. list.concat(taicpu.op_reg(A_BLX, reg));
  590. {
  591. the compiler does not properly set this flag anymore in pass 1, and
  592. for now we only need it after pass 2 (I hope) (JM)
  593. if not(pi_do_call in current_procinfo.flags) then
  594. internalerror(2003060703);
  595. }
  596. include(current_procinfo.flags,pi_do_call);
  597. end;
  598. procedure tcgarm.a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister);
  599. begin
  600. a_op_const_reg_reg(list,op,size,a,reg,reg);
  601. end;
  602. procedure tcgarm.a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference);
  603. var
  604. tmpreg,tmpresreg : tregister;
  605. tmpref : treference;
  606. begin
  607. tmpreg:=getintregister(list,size);
  608. tmpresreg:=getintregister(list,size);
  609. tmpref:=a_internal_load_ref_reg(list,size,size,ref,tmpreg);
  610. a_op_const_reg_reg(list,op,size,a,tmpreg,tmpresreg);
  611. a_load_reg_ref(list,size,size,tmpresreg,tmpref);
  612. end;
  613. procedure tcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  614. var
  615. so : tshifterop;
  616. begin
  617. if op = OP_NEG then
  618. begin
  619. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,src,0));
  620. maybeadjustresult(list,OP_NEG,size,dst);
  621. end
  622. else if op = OP_NOT then
  623. begin
  624. if size in [OS_8, OS_16, OS_S8, OS_S16] then
  625. begin
  626. shifterop_reset(so);
  627. so.shiftmode:=SM_LSL;
  628. if size in [OS_8, OS_S8] then
  629. so.shiftimm:=24
  630. else
  631. so.shiftimm:=16;
  632. list.concat(taicpu.op_reg_reg_shifterop(A_MVN,dst,src,so));
  633. {Using a shift here allows this to be folded into another instruction}
  634. if size in [OS_S8, OS_S16] then
  635. so.shiftmode:=SM_ASR
  636. else
  637. so.shiftmode:=SM_LSR;
  638. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  639. end
  640. else
  641. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  642. end
  643. else
  644. a_op_reg_reg_reg(list,op,size,src,dst,dst);
  645. end;
  646. const
  647. op_reg_reg_opcg2asmop: array[TOpCG] of tasmop =
  648. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  649. A_NONE,A_NONE,A_NONE,A_SUB,A_EOR,A_NONE,A_NONE);
  650. op_reg_opcg2asmop: array[TOpCG] of tasmop =
  651. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  652. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  653. op_reg_postfix: array[TOpCG] of TOpPostfix =
  654. (PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,
  655. PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None);
  656. procedure tcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  657. size: tcgsize; a: tcgint; src, dst: tregister);
  658. var
  659. ovloc : tlocation;
  660. begin
  661. a_op_const_reg_reg_checkoverflow(list,op,size,a,src,dst,false,ovloc);
  662. end;
  663. procedure tcgarm.a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  664. size: tcgsize; src1, src2, dst: tregister);
  665. var
  666. ovloc : tlocation;
  667. begin
  668. a_op_reg_reg_reg_checkoverflow(list,op,size,src1,src2,dst,false,ovloc);
  669. end;
  670. function opshift2shiftmode(op: TOpCg): tshiftmode;
  671. begin
  672. case op of
  673. OP_SHL: Result:=SM_LSL;
  674. OP_SHR: Result:=SM_LSR;
  675. OP_ROR: Result:=SM_ROR;
  676. OP_ROL: Result:=SM_ROR;
  677. OP_SAR: Result:=SM_ASR;
  678. else internalerror(2012070501);
  679. end
  680. end;
  681. function tbasecgarm.try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  682. var
  683. multiplier : dword;
  684. power : longint;
  685. shifterop : tshifterop;
  686. bitsset : byte;
  687. negative : boolean;
  688. first : boolean;
  689. b,
  690. cycles : byte;
  691. maxeffort : byte;
  692. begin
  693. result:=true;
  694. cycles:=0;
  695. negative:=a<0;
  696. shifterop.rs:=NR_NO;
  697. shifterop.shiftmode:=SM_LSL;
  698. if negative then
  699. inc(cycles);
  700. multiplier:=dword(abs(a));
  701. bitsset:=popcnt(multiplier and $fffffffe);
  702. { heuristics to estimate how much instructions are reasonable to replace the mul,
  703. this is currently based on XScale timings }
  704. { in the simplest case, we need a mov to load the constant and a mul to carry out the
  705. actual multiplication, this requires min. 1+4 cycles
  706. because the first shift imm. might cause a stall and because we need more instructions
  707. when replacing the mul we generate max. 3 instructions to replace this mul }
  708. maxeffort:=3;
  709. { if the constant is not a shifter op, we need either some mov/mvn/bic/or sequence or
  710. a ldr, so generating one more operation to replace this is beneficial }
  711. if not(is_shifter_const(dword(a),b)) and not(is_shifter_const(not(dword(a)),b)) then
  712. inc(maxeffort);
  713. { if the upper 5 bits are all set or clear, mul is one cycle faster }
  714. if ((dword(a) and $f8000000)=0) or ((dword(a) and $f8000000)=$f8000000) then
  715. dec(maxeffort);
  716. { if the upper 17 bits are all set or clear, mul is another cycle faster }
  717. if ((dword(a) and $ffff8000)=0) or ((dword(a) and $ffff8000)=$ffff8000) then
  718. dec(maxeffort);
  719. { most simple cases }
  720. if a=1 then
  721. a_load_reg_reg(list,OS_32,OS_32,src,dst)
  722. else if a=0 then
  723. a_load_const_reg(list,OS_32,0,dst)
  724. else if a=-1 then
  725. a_op_reg_reg(list,OP_NEG,OS_32,src,dst)
  726. { add up ?
  727. basically, one add is needed for each bit being set in the constant factor
  728. however, the least significant bit is for free, it can be hidden in the initial
  729. instruction
  730. }
  731. else if (bitsset+cycles<=maxeffort) and
  732. (bitsset<=popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)) then
  733. begin
  734. first:=true;
  735. while multiplier<>0 do
  736. begin
  737. shifterop.shiftimm:=BsrDWord(multiplier);
  738. if odd(multiplier) then
  739. begin
  740. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,shifterop));
  741. dec(multiplier);
  742. end
  743. else
  744. if first then
  745. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  746. else
  747. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,src,shifterop));
  748. first:=false;
  749. dec(multiplier,1 shl shifterop.shiftimm);
  750. end;
  751. if negative then
  752. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  753. end
  754. { subtract from the next greater power of two? }
  755. else if popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)+cycles+1<=maxeffort then
  756. begin
  757. first:=true;
  758. while multiplier<>0 do
  759. begin
  760. if first then
  761. begin
  762. multiplier:=(1 shl power)-multiplier;
  763. shifterop.shiftimm:=power;
  764. end
  765. else
  766. shifterop.shiftimm:=BsrDWord(multiplier);
  767. if odd(multiplier) then
  768. begin
  769. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,shifterop));
  770. dec(multiplier);
  771. end
  772. else
  773. if first then
  774. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  775. else
  776. begin
  777. list.concat(taicpu.op_reg_reg_reg_shifterop(A_SUB,dst,dst,src,shifterop));
  778. dec(multiplier,1 shl shifterop.shiftimm);
  779. end;
  780. first:=false;
  781. end;
  782. if negative then
  783. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  784. end
  785. else
  786. result:=false;
  787. end;
  788. procedure tcgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  789. var
  790. shift, lsb, width : byte;
  791. tmpreg : tregister;
  792. so : tshifterop;
  793. l1 : longint;
  794. imm1, imm2: DWord;
  795. begin
  796. optimize_op_const(size, op, a);
  797. case op of
  798. OP_NONE:
  799. begin
  800. if src <> dst then
  801. a_load_reg_reg(list, size, size, src, dst);
  802. exit;
  803. end;
  804. OP_MOVE:
  805. begin
  806. a_load_const_reg(list, size, a, dst);
  807. exit;
  808. end;
  809. end;
  810. ovloc.loc:=LOC_VOID;
  811. if {$ifopt R+}(a<>-2147483648) and{$endif} not setflags and is_shifter_const(-a,shift) then
  812. case op of
  813. OP_ADD:
  814. begin
  815. op:=OP_SUB;
  816. a:=aint(dword(-a));
  817. end;
  818. OP_SUB:
  819. begin
  820. op:=OP_ADD;
  821. a:=aint(dword(-a));
  822. end
  823. end;
  824. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  825. case op of
  826. OP_NEG,OP_NOT:
  827. internalerror(200308281);
  828. OP_SHL,
  829. OP_SHR,
  830. OP_ROL,
  831. OP_ROR,
  832. OP_SAR:
  833. begin
  834. if a>32 then
  835. internalerror(200308294);
  836. shifterop_reset(so);
  837. so.shiftmode:=opshift2shiftmode(op);
  838. if op = OP_ROL then
  839. so.shiftimm:=32-a
  840. else
  841. so.shiftimm:=a;
  842. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  843. end;
  844. else
  845. {if (op in [OP_SUB, OP_ADD]) and
  846. ((a < 0) or
  847. (a > 4095)) then
  848. begin
  849. tmpreg:=getintregister(list,size);
  850. list.concat(taicpu.op_reg_const(A_MOVT, tmpreg, (a shr 16) and $FFFF));
  851. list.concat(taicpu.op_reg_const(A_MOV, tmpreg, a and $FFFF));
  852. list.concat(setoppostfix(taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))
  853. ));
  854. end
  855. else}
  856. begin
  857. if cgsetflags or setflags then
  858. a_reg_alloc(list,NR_DEFAULTFLAGS);
  859. list.concat(setoppostfix(
  860. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  861. end;
  862. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  863. begin
  864. ovloc.loc:=LOC_FLAGS;
  865. case op of
  866. OP_ADD:
  867. ovloc.resflags:=F_CS;
  868. OP_SUB:
  869. ovloc.resflags:=F_CC;
  870. end;
  871. end;
  872. end
  873. else
  874. begin
  875. { there could be added some more sophisticated optimizations }
  876. if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  877. a_op_reg_reg(list,OP_NEG,size,src,dst)
  878. { we do this here instead in the peephole optimizer because
  879. it saves us a register }
  880. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  881. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  882. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  883. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  884. begin
  885. if l1>32 then{roozbeh does this ever happen?}
  886. internalerror(200308296);
  887. shifterop_reset(so);
  888. so.shiftmode:=SM_LSL;
  889. so.shiftimm:=l1;
  890. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  891. end
  892. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  893. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  894. begin
  895. if l1>32 then{does this ever happen?}
  896. internalerror(201205181);
  897. shifterop_reset(so);
  898. so.shiftmode:=SM_LSL;
  899. so.shiftimm:=l1;
  900. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  901. end
  902. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  903. begin
  904. { nothing to do on success }
  905. end
  906. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  907. broader range of shifterconstants.}
  908. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  909. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  910. { Doing two shifts instead of two bics might allow the peephole optimizer to fold the second shift
  911. into the following instruction}
  912. else if (op = OP_AND) and
  913. is_continuous_mask(a, lsb, width) and
  914. ((lsb = 0) or ((lsb + width) = 32)) then
  915. begin
  916. shifterop_reset(so);
  917. if (width = 16) and
  918. (lsb = 0) and
  919. (current_settings.cputype >= cpu_armv6) then
  920. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  921. else if (width = 8) and
  922. (lsb = 0) and
  923. (current_settings.cputype >= cpu_armv6) then
  924. list.concat(taicpu.op_reg_reg(A_UXTB,dst,src))
  925. else if lsb = 0 then
  926. begin
  927. so.shiftmode:=SM_LSL;
  928. so.shiftimm:=32-width;
  929. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  930. so.shiftmode:=SM_LSR;
  931. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  932. end
  933. else
  934. begin
  935. so.shiftmode:=SM_LSR;
  936. so.shiftimm:=lsb;
  937. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  938. so.shiftmode:=SM_LSL;
  939. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  940. end;
  941. end
  942. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  943. begin
  944. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,imm1));
  945. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  946. end
  947. else if (op in [OP_ADD, OP_SUB, OP_OR, OP_XOR]) and
  948. not(cgsetflags or setflags) and
  949. split_into_shifter_const(a, imm1, imm2) then
  950. begin
  951. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,imm1));
  952. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  953. end
  954. else
  955. begin
  956. tmpreg:=getintregister(list,size);
  957. a_load_const_reg(list,size,a,tmpreg);
  958. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  959. end;
  960. end;
  961. maybeadjustresult(list,op,size,dst);
  962. end;
  963. procedure tcgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  964. var
  965. so : tshifterop;
  966. tmpreg,overflowreg : tregister;
  967. asmop : tasmop;
  968. begin
  969. ovloc.loc:=LOC_VOID;
  970. case op of
  971. OP_NEG,OP_NOT,
  972. OP_DIV,OP_IDIV:
  973. internalerror(200308283);
  974. OP_SHL,
  975. OP_SHR,
  976. OP_SAR,
  977. OP_ROR:
  978. begin
  979. if (op = OP_ROR) and not(size in [OS_32,OS_S32]) then
  980. internalerror(2008072801);
  981. shifterop_reset(so);
  982. so.rs:=src1;
  983. so.shiftmode:=opshift2shiftmode(op);
  984. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  985. end;
  986. OP_ROL:
  987. begin
  988. if not(size in [OS_32,OS_S32]) then
  989. internalerror(2008072801);
  990. { simulate ROL by ror'ing 32-value }
  991. tmpreg:=getintregister(list,OS_32);
  992. list.concat(taicpu.op_reg_reg_const(A_RSB,tmpreg,src1, 32));
  993. shifterop_reset(so);
  994. so.rs:=tmpreg;
  995. so.shiftmode:=SM_ROR;
  996. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  997. end;
  998. OP_IMUL,
  999. OP_MUL:
  1000. begin
  1001. if (cgsetflags or setflags) and
  1002. (CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype]) then
  1003. begin
  1004. overflowreg:=getintregister(list,size);
  1005. if op=OP_IMUL then
  1006. asmop:=A_SMULL
  1007. else
  1008. asmop:=A_UMULL;
  1009. { the arm doesn't allow that rd and rm are the same }
  1010. if dst=src2 then
  1011. begin
  1012. if dst<>src1 then
  1013. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  1014. else
  1015. begin
  1016. tmpreg:=getintregister(list,size);
  1017. a_load_reg_reg(list,size,size,src2,dst);
  1018. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  1019. end;
  1020. end
  1021. else
  1022. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  1023. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1024. if op=OP_IMUL then
  1025. begin
  1026. shifterop_reset(so);
  1027. so.shiftmode:=SM_ASR;
  1028. so.shiftimm:=31;
  1029. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  1030. end
  1031. else
  1032. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  1033. ovloc.loc:=LOC_FLAGS;
  1034. ovloc.resflags:=F_NE;
  1035. end
  1036. else
  1037. begin
  1038. { the arm doesn't allow that rd and rm are the same }
  1039. if dst=src2 then
  1040. begin
  1041. if dst<>src1 then
  1042. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  1043. else
  1044. begin
  1045. tmpreg:=getintregister(list,size);
  1046. a_load_reg_reg(list,size,size,src2,dst);
  1047. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  1048. end;
  1049. end
  1050. else
  1051. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  1052. end;
  1053. end;
  1054. else
  1055. begin
  1056. if cgsetflags or setflags then
  1057. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1058. list.concat(setoppostfix(
  1059. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  1060. end;
  1061. end;
  1062. maybeadjustresult(list,op,size,dst);
  1063. end;
  1064. procedure tcgarm.a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister);
  1065. var
  1066. asmop: tasmop;
  1067. begin
  1068. if CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype] then
  1069. begin
  1070. list.concat(tai_comment.create(strpnew('tcgarm.a_mul_reg_reg_pair called')));
  1071. case size of
  1072. OS_32: asmop:=A_UMULL;
  1073. OS_S32: asmop:=A_SMULL;
  1074. else
  1075. InternalError(2014060802);
  1076. end;
  1077. { The caller might omit dstlo or dsthi, when he is not interested in it, we still
  1078. need valid registers everywhere. In case of dsthi = NR_NO we could fall back to
  1079. 32x32=32 bit multiplication}
  1080. if (dstlo = NR_NO) then
  1081. dstlo:=getintregister(list,size);
  1082. if (dsthi = NR_NO) then
  1083. dsthi:=getintregister(list,size);
  1084. list.concat(taicpu.op_reg_reg_reg_reg(asmop, dstlo, dsthi, src1,src2));
  1085. end
  1086. else if dsthi=NR_NO then
  1087. begin
  1088. if (dstlo = NR_NO) then
  1089. dstlo:=getintregister(list,size);
  1090. list.concat(taicpu.op_reg_reg_reg(A_MUL, dstlo, src1,src2));
  1091. end
  1092. else
  1093. begin
  1094. internalerror(2015083022);
  1095. end;
  1096. end;
  1097. function tbasecgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  1098. var
  1099. tmpreg1,tmpreg2 : tregister;
  1100. tmpref : treference;
  1101. l : tasmlabel;
  1102. begin
  1103. tmpreg1:=NR_NO;
  1104. { Be sure to have a base register }
  1105. if (ref.base=NR_NO) then
  1106. begin
  1107. if ref.shiftmode<>SM_None then
  1108. internalerror(2014020701);
  1109. ref.base:=ref.index;
  1110. ref.index:=NR_NO;
  1111. end;
  1112. { absolute symbols can't be handled directly, we've to store the symbol reference
  1113. in the text segment and access it pc relative
  1114. For now, we assume that references where base or index equals to PC are already
  1115. relative, all other references are assumed to be absolute and thus they need
  1116. to be handled extra.
  1117. A proper solution would be to change refoptions to a set and store the information
  1118. if the symbol is absolute or relative there.
  1119. }
  1120. if (assigned(ref.symbol) and
  1121. not(is_pc(ref.base)) and
  1122. not(is_pc(ref.index))
  1123. ) or
  1124. { [#xxx] isn't a valid address operand }
  1125. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  1126. (ref.offset<-4095) or
  1127. (ref.offset>4095) or
  1128. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  1129. ((ref.offset<-255) or
  1130. (ref.offset>255)
  1131. )
  1132. ) or
  1133. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1134. ((ref.offset<-1020) or
  1135. (ref.offset>1020) or
  1136. ((abs(ref.offset) mod 4)<>0)
  1137. )
  1138. ) or
  1139. ((GenerateThumbCode) and
  1140. (((oppostfix in [PF_SB,PF_SH]) and (ref.offset<>0)) or
  1141. ((oppostfix=PF_None) and ((ref.offset<0) or ((ref.base<>NR_STACK_POINTER_REG) and (ref.offset>124)) or
  1142. ((ref.base=NR_STACK_POINTER_REG) and (ref.offset>1020)) or ((ref.offset mod 4)<>0))) or
  1143. ((oppostfix=PF_H) and ((ref.offset<0) or (ref.offset>62) or ((ref.offset mod 2)<>0) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0)))) or
  1144. ((oppostfix=PF_B) and ((ref.offset<0) or (ref.offset>31) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0))))
  1145. )
  1146. ) then
  1147. begin
  1148. fixref(list,ref);
  1149. end;
  1150. if GenerateThumbCode then
  1151. begin
  1152. { certain thumb load require base and index }
  1153. if (oppostfix in [PF_SB,PF_SH]) and
  1154. (ref.base<>NR_NO) and (ref.index=NR_NO) then
  1155. begin
  1156. tmpreg1:=getintregister(list,OS_ADDR);
  1157. a_load_const_reg(list,OS_ADDR,0,tmpreg1);
  1158. ref.index:=tmpreg1;
  1159. end;
  1160. { "hi" registers cannot be used as base or index }
  1161. if (getsupreg(ref.base) in [RS_R8..RS_R12,RS_R14]) or
  1162. ((ref.base=NR_R13) and (ref.index<>NR_NO)) then
  1163. begin
  1164. tmpreg1:=getintregister(list,OS_ADDR);
  1165. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.base,tmpreg1);
  1166. ref.base:=tmpreg1;
  1167. end;
  1168. if getsupreg(ref.index) in [RS_R8..RS_R14] then
  1169. begin
  1170. tmpreg1:=getintregister(list,OS_ADDR);
  1171. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.index,tmpreg1);
  1172. ref.index:=tmpreg1;
  1173. end;
  1174. end;
  1175. { fold if there is base, index and offset, however, don't fold
  1176. for vfp memory instructions because we later fold the index }
  1177. if not((op in [A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1178. (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  1179. begin
  1180. if tmpreg1<>NR_NO then
  1181. begin
  1182. tmpreg2:=getintregister(list,OS_ADDR);
  1183. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg1,tmpreg2);
  1184. tmpreg1:=tmpreg2;
  1185. end
  1186. else
  1187. begin
  1188. tmpreg1:=getintregister(list,OS_ADDR);
  1189. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg1);
  1190. ref.base:=tmpreg1;
  1191. end;
  1192. ref.offset:=0;
  1193. end;
  1194. { floating point operations have only limited references
  1195. we expect here, that a base is already set }
  1196. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  1197. begin
  1198. if ref.shiftmode<>SM_none then
  1199. internalerror(200309121);
  1200. if tmpreg1<>NR_NO then
  1201. begin
  1202. if ref.base=tmpreg1 then
  1203. begin
  1204. if ref.signindex<0 then
  1205. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,tmpreg1,ref.index))
  1206. else
  1207. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,tmpreg1,ref.index));
  1208. ref.index:=NR_NO;
  1209. end
  1210. else
  1211. begin
  1212. if ref.index<>tmpreg1 then
  1213. internalerror(200403161);
  1214. if ref.signindex<0 then
  1215. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,ref.base,tmpreg1))
  1216. else
  1217. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,tmpreg1));
  1218. ref.base:=tmpreg1;
  1219. ref.index:=NR_NO;
  1220. end;
  1221. end
  1222. else
  1223. begin
  1224. tmpreg1:=getintregister(list,OS_ADDR);
  1225. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,ref.index));
  1226. ref.base:=tmpreg1;
  1227. ref.index:=NR_NO;
  1228. end;
  1229. end;
  1230. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  1231. Result := ref;
  1232. end;
  1233. procedure tbasecgarm.a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);
  1234. var
  1235. oppostfix:toppostfix;
  1236. usedtmpref: treference;
  1237. tmpreg : tregister;
  1238. dir : integer;
  1239. begin
  1240. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  1241. FromSize := ToSize;
  1242. case ToSize of
  1243. { signed integer registers }
  1244. OS_8,
  1245. OS_S8:
  1246. oppostfix:=PF_B;
  1247. OS_16,
  1248. OS_S16:
  1249. oppostfix:=PF_H;
  1250. OS_32,
  1251. OS_S32,
  1252. { for vfp value stored in integer register }
  1253. OS_F32:
  1254. oppostfix:=PF_None;
  1255. else
  1256. InternalError(200308299);
  1257. end;
  1258. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[tosize])) or
  1259. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  1260. (oppostfix =PF_H)) then
  1261. begin
  1262. if target_info.endian=endian_big then
  1263. dir:=-1
  1264. else
  1265. dir:=1;
  1266. case FromSize of
  1267. OS_16,OS_S16:
  1268. begin
  1269. tmpreg:=getintregister(list,OS_INT);
  1270. usedtmpref:=ref;
  1271. if target_info.endian=endian_big then
  1272. inc(usedtmpref.offset,1);
  1273. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1274. inc(usedtmpref.offset,dir);
  1275. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1276. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1277. end;
  1278. OS_32,OS_S32:
  1279. begin
  1280. tmpreg:=getintregister(list,OS_INT);
  1281. usedtmpref:=ref;
  1282. if ref.alignment=2 then
  1283. begin
  1284. if target_info.endian=endian_big then
  1285. inc(usedtmpref.offset,2);
  1286. usedtmpref:=a_internal_load_reg_ref(list,OS_16,OS_16,reg,usedtmpref);
  1287. a_op_const_reg_reg(list,OP_SHR,OS_INT,16,reg,tmpreg);
  1288. inc(usedtmpref.offset,dir*2);
  1289. a_internal_load_reg_ref(list,OS_16,OS_16,tmpreg,usedtmpref);
  1290. end
  1291. else
  1292. begin
  1293. if target_info.endian=endian_big then
  1294. inc(usedtmpref.offset,3);
  1295. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1296. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1297. inc(usedtmpref.offset,dir);
  1298. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1299. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1300. inc(usedtmpref.offset,dir);
  1301. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1302. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1303. inc(usedtmpref.offset,dir);
  1304. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1305. end;
  1306. end
  1307. else
  1308. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1309. end;
  1310. end
  1311. else
  1312. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1313. end;
  1314. function tbasecgarm.a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  1315. var
  1316. oppostfix:toppostfix;
  1317. href: treference;
  1318. tmpreg: TRegister;
  1319. begin
  1320. case ToSize of
  1321. { signed integer registers }
  1322. OS_8,
  1323. OS_S8:
  1324. oppostfix:=PF_B;
  1325. OS_16,
  1326. OS_S16:
  1327. oppostfix:=PF_H;
  1328. OS_32,
  1329. OS_S32:
  1330. oppostfix:=PF_None;
  1331. else
  1332. InternalError(2003082910);
  1333. end;
  1334. if (tosize in [OS_S16,OS_16]) and
  1335. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1336. begin
  1337. result:=handle_load_store(list,A_STR,PF_B,reg,ref);
  1338. tmpreg:=getintregister(list,OS_INT);
  1339. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1340. href:=result;
  1341. inc(href.offset);
  1342. handle_load_store(list,A_STR,PF_B,tmpreg,href);
  1343. end
  1344. else
  1345. result:=handle_load_store(list,A_STR,oppostfix,reg,ref);
  1346. end;
  1347. function tbasecgarm.a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  1348. var
  1349. oppostfix:toppostfix;
  1350. so: tshifterop;
  1351. tmpreg: TRegister;
  1352. href: treference;
  1353. begin
  1354. case FromSize of
  1355. { signed integer registers }
  1356. OS_8:
  1357. oppostfix:=PF_B;
  1358. OS_S8:
  1359. oppostfix:=PF_SB;
  1360. OS_16:
  1361. oppostfix:=PF_H;
  1362. OS_S16:
  1363. oppostfix:=PF_SH;
  1364. OS_32,
  1365. OS_S32:
  1366. oppostfix:=PF_None;
  1367. else
  1368. InternalError(200308291);
  1369. end;
  1370. if (tosize=OS_S8) and
  1371. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1372. begin
  1373. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1374. a_load_reg_reg(list,OS_S8,OS_32,reg,reg);
  1375. end
  1376. else if (tosize in [OS_S16,OS_16]) and
  1377. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1378. begin
  1379. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1380. tmpreg:=getintregister(list,OS_INT);
  1381. href:=result;
  1382. inc(href.offset);
  1383. handle_load_store(list,A_LDR,PF_B,tmpreg,href);
  1384. shifterop_reset(so);
  1385. so.shiftmode:=SM_LSL;
  1386. so.shiftimm:=8;
  1387. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  1388. end
  1389. else
  1390. result:=handle_load_store(list,A_LDR,oppostfix,reg,ref);
  1391. end;
  1392. procedure tbasecgarm.a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);
  1393. var
  1394. so : tshifterop;
  1395. procedure do_shift(shiftmode : tshiftmode; shiftimm : byte; reg : tregister);
  1396. begin
  1397. if GenerateThumbCode then
  1398. begin
  1399. case shiftmode of
  1400. SM_ASR:
  1401. a_op_const_reg_reg(list,OP_SAR,OS_32,shiftimm,reg,reg2);
  1402. SM_LSR:
  1403. a_op_const_reg_reg(list,OP_SHR,OS_32,shiftimm,reg,reg2);
  1404. SM_LSL:
  1405. a_op_const_reg_reg(list,OP_SHL,OS_32,shiftimm,reg,reg2);
  1406. else
  1407. internalerror(2013090301);
  1408. end;
  1409. end
  1410. else
  1411. begin
  1412. so.shiftmode:=shiftmode;
  1413. so.shiftimm:=shiftimm;
  1414. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,reg2,reg,so));
  1415. end;
  1416. end;
  1417. var
  1418. instr: taicpu;
  1419. conv_done: boolean;
  1420. begin
  1421. if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then
  1422. internalerror(2002090901);
  1423. conv_done:=false;
  1424. if tosize<>fromsize then
  1425. begin
  1426. shifterop_reset(so);
  1427. conv_done:=true;
  1428. if tcgsize2size[tosize]<=tcgsize2size[fromsize] then
  1429. fromsize:=tosize;
  1430. if current_settings.cputype<cpu_armv6 then
  1431. case fromsize of
  1432. OS_8:
  1433. if GenerateThumbCode then
  1434. a_op_const_reg_reg(list,OP_AND,OS_32,$ff,reg1,reg2)
  1435. else
  1436. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1437. OS_S8:
  1438. begin
  1439. do_shift(SM_LSL,24,reg1);
  1440. if tosize=OS_16 then
  1441. begin
  1442. do_shift(SM_ASR,8,reg2);
  1443. do_shift(SM_LSR,16,reg2);
  1444. end
  1445. else
  1446. do_shift(SM_ASR,24,reg2);
  1447. end;
  1448. OS_16:
  1449. begin
  1450. do_shift(SM_LSL,16,reg1);
  1451. do_shift(SM_LSR,16,reg2);
  1452. end;
  1453. OS_S16:
  1454. begin
  1455. do_shift(SM_LSL,16,reg1);
  1456. do_shift(SM_ASR,16,reg2)
  1457. end;
  1458. else
  1459. conv_done:=false;
  1460. end
  1461. else
  1462. case fromsize of
  1463. OS_8:
  1464. if GenerateThumbCode then
  1465. list.concat(taicpu.op_reg_reg(A_UXTB,reg2,reg1))
  1466. else
  1467. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1468. OS_S8:
  1469. begin
  1470. if tosize=OS_16 then
  1471. begin
  1472. so.shiftmode:=SM_ROR;
  1473. so.shiftimm:=16;
  1474. list.concat(taicpu.op_reg_reg_shifterop(A_SXTB16,reg2,reg1,so));
  1475. do_shift(SM_LSR,16,reg2);
  1476. end
  1477. else
  1478. list.concat(taicpu.op_reg_reg(A_SXTB,reg2,reg1));
  1479. end;
  1480. OS_16:
  1481. list.concat(taicpu.op_reg_reg(A_UXTH,reg2,reg1));
  1482. OS_S16:
  1483. list.concat(taicpu.op_reg_reg(A_SXTH,reg2,reg1));
  1484. else
  1485. conv_done:=false;
  1486. end
  1487. end;
  1488. if not conv_done and (reg1<>reg2) then
  1489. begin
  1490. { same size, only a register mov required }
  1491. instr:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
  1492. list.Concat(instr);
  1493. { Notify the register allocator that we have written a move instruction so
  1494. it can try to eliminate it. }
  1495. add_move_instruction(instr);
  1496. end;
  1497. end;
  1498. procedure tbasecgarm.a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);
  1499. var
  1500. href,href2 : treference;
  1501. hloc : pcgparalocation;
  1502. begin
  1503. href:=ref;
  1504. hloc:=paraloc.location;
  1505. while assigned(hloc) do
  1506. begin
  1507. case hloc^.loc of
  1508. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  1509. begin
  1510. paramanager.allocparaloc(list,paraloc.location);
  1511. a_loadfpu_ref_reg(list,size,size,ref,hloc^.register);
  1512. end;
  1513. LOC_REGISTER :
  1514. case hloc^.size of
  1515. OS_32,
  1516. OS_F32:
  1517. begin
  1518. paramanager.allocparaloc(list,paraloc.location);
  1519. a_load_ref_reg(list,OS_32,OS_32,href,hloc^.register);
  1520. end;
  1521. OS_64,
  1522. OS_F64:
  1523. cg64.a_load64_ref_cgpara(list,href,paraloc);
  1524. else
  1525. a_load_ref_reg(list,hloc^.size,hloc^.size,href,hloc^.register);
  1526. end;
  1527. LOC_REFERENCE :
  1528. begin
  1529. reference_reset_base(href2,hloc^.reference.index,hloc^.reference.offset,paraloc.alignment);
  1530. { concatcopy should choose the best way to copy the data }
  1531. g_concatcopy(list,href,href2,tcgsize2size[hloc^.size]);
  1532. end;
  1533. else
  1534. internalerror(200408241);
  1535. end;
  1536. inc(href.offset,tcgsize2size[hloc^.size]);
  1537. hloc:=hloc^.next;
  1538. end;
  1539. end;
  1540. procedure tbasecgarm.a_loadfpu_reg_reg(list: TAsmList; fromsize,tosize: tcgsize; reg1, reg2: tregister);
  1541. begin
  1542. list.concat(setoppostfix(taicpu.op_reg_reg(A_MVF,reg2,reg1),cgsize2fpuoppostfix[tosize]));
  1543. end;
  1544. procedure tbasecgarm.a_loadfpu_ref_reg(list: TAsmList; fromsize,tosize: tcgsize; const ref: treference; reg: tregister);
  1545. var
  1546. oppostfix:toppostfix;
  1547. begin
  1548. case fromsize of
  1549. OS_32,
  1550. OS_F32:
  1551. oppostfix:=PF_S;
  1552. OS_64,
  1553. OS_F64:
  1554. oppostfix:=PF_D;
  1555. OS_F80:
  1556. oppostfix:=PF_E;
  1557. else
  1558. InternalError(200309021);
  1559. end;
  1560. handle_load_store(list,A_LDF,oppostfix,reg,ref);
  1561. if fromsize<>tosize then
  1562. a_loadfpu_reg_reg(list,fromsize,tosize,reg,reg);
  1563. end;
  1564. procedure tbasecgarm.a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);
  1565. var
  1566. oppostfix:toppostfix;
  1567. begin
  1568. case tosize of
  1569. OS_F32:
  1570. oppostfix:=PF_S;
  1571. OS_F64:
  1572. oppostfix:=PF_D;
  1573. OS_F80:
  1574. oppostfix:=PF_E;
  1575. else
  1576. InternalError(200309022);
  1577. end;
  1578. handle_load_store(list,A_STF,oppostfix,reg,ref);
  1579. end;
  1580. { comparison operations }
  1581. procedure tbasecgarm.a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  1582. l : tasmlabel);
  1583. var
  1584. tmpreg : tregister;
  1585. b : byte;
  1586. begin
  1587. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1588. if (not(GenerateThumbCode) and is_shifter_const(a,b)) or
  1589. ((GenerateThumbCode) and is_thumb_imm(a)) then
  1590. list.concat(taicpu.op_reg_const(A_CMP,reg,a))
  1591. { CMN reg,0 and CMN reg,$80000000 are different from CMP reg,$ffffffff
  1592. and CMP reg,$7fffffff regarding the flags according to the ARM manual }
  1593. else if (a<>$7fffffff) and (a<>-1) and not(GenerateThumbCode) and is_shifter_const(-a,b) then
  1594. list.concat(taicpu.op_reg_const(A_CMN,reg,-a))
  1595. else
  1596. begin
  1597. tmpreg:=getintregister(list,size);
  1598. a_load_const_reg(list,size,a,tmpreg);
  1599. list.concat(taicpu.op_reg_reg(A_CMP,reg,tmpreg));
  1600. end;
  1601. a_jmp_cond(list,cmp_op,l);
  1602. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1603. end;
  1604. procedure tbasecgarm.a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister);
  1605. begin
  1606. if reverse then
  1607. begin
  1608. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,src));
  1609. list.Concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,31));
  1610. list.Concat(taicpu.op_reg_reg_const(A_AND,dst,dst,255));
  1611. end
  1612. { it is decided during the compilation of the system unit if this code is used or not
  1613. so no additional check for rbit is needed }
  1614. else
  1615. begin
  1616. list.Concat(taicpu.op_reg_reg(A_RBIT,dst,src));
  1617. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,dst));
  1618. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1619. list.Concat(taicpu.op_reg_const(A_CMP,dst,32));
  1620. if GenerateThumb2Code then
  1621. list.Concat(taicpu.op_cond(A_IT, C_EQ));
  1622. list.Concat(setcondition(taicpu.op_reg_const(A_MOV,dst,$ff),C_EQ));
  1623. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1624. end;
  1625. end;
  1626. procedure tbasecgarm.a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel);
  1627. begin
  1628. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1629. list.concat(taicpu.op_reg_reg(A_CMP,reg2,reg1));
  1630. a_jmp_cond(list,cmp_op,l);
  1631. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1632. end;
  1633. procedure tbasecgarm.a_jmp_name(list : TAsmList;const s : string);
  1634. var
  1635. ai : taicpu;
  1636. begin
  1637. { generate far jump, leave it to the optimizer to get rid of it }
  1638. if GenerateThumbCode then
  1639. ai:=taicpu.op_sym(A_BL,current_asmdata.RefAsmSymbol(s))
  1640. else
  1641. ai:=taicpu.op_sym(A_B,current_asmdata.RefAsmSymbol(s));
  1642. ai.is_jmp:=true;
  1643. list.concat(ai);
  1644. end;
  1645. procedure tbasecgarm.a_jmp_always(list : TAsmList;l: tasmlabel);
  1646. var
  1647. ai : taicpu;
  1648. begin
  1649. { generate far jump, leave it to the optimizer to get rid of it }
  1650. if GenerateThumbCode then
  1651. ai:=taicpu.op_sym(A_BL,l)
  1652. else
  1653. ai:=taicpu.op_sym(A_B,l);
  1654. ai.is_jmp:=true;
  1655. list.concat(ai);
  1656. end;
  1657. procedure tbasecgarm.a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel);
  1658. var
  1659. ai : taicpu;
  1660. inv_flags : TResFlags;
  1661. hlabel : TAsmLabel;
  1662. begin
  1663. if GenerateThumbCode then
  1664. begin
  1665. inv_flags:=f;
  1666. inverse_flags(inv_flags);
  1667. { the optimizer has to fix this if jump range is sufficient short }
  1668. current_asmdata.getjumplabel(hlabel);
  1669. ai:=setcondition(taicpu.op_sym(A_B,hlabel),flags_to_cond(inv_flags));
  1670. ai.is_jmp:=true;
  1671. list.concat(ai);
  1672. a_jmp_always(list,l);
  1673. a_label(list,hlabel);
  1674. end
  1675. else
  1676. begin
  1677. ai:=setcondition(taicpu.op_sym(A_B,l),flags_to_cond(f));
  1678. ai.is_jmp:=true;
  1679. list.concat(ai);
  1680. end;
  1681. end;
  1682. procedure tbasecgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  1683. begin
  1684. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  1685. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  1686. end;
  1687. procedure tbasecgarm.g_profilecode(list : TAsmList);
  1688. begin
  1689. if target_info.system = system_arm_linux then
  1690. begin
  1691. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R14]));
  1692. a_call_name(list,'__gnu_mcount_nc',false);
  1693. end
  1694. else
  1695. internalerror(2014091201);
  1696. end;
  1697. procedure tbasecgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  1698. var
  1699. ref : treference;
  1700. shift : byte;
  1701. firstfloatreg,lastfloatreg,
  1702. r : byte;
  1703. mmregs,
  1704. regs, saveregs : tcpuregisterset;
  1705. registerarea,
  1706. r7offset,
  1707. stackmisalignment : pint;
  1708. postfix: toppostfix;
  1709. imm1, imm2: DWord;
  1710. stack_parameters : Boolean;
  1711. begin
  1712. LocalSize:=align(LocalSize,4);
  1713. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  1714. { call instruction does not put anything on the stack }
  1715. registerarea:=0;
  1716. tarmprocinfo(current_procinfo).stackpaddingreg:=High(TSuperRegister);
  1717. lastfloatreg:=RS_NO;
  1718. if not(nostackframe) then
  1719. begin
  1720. firstfloatreg:=RS_NO;
  1721. mmregs:=[];
  1722. case current_settings.fputype of
  1723. fpu_fpa,
  1724. fpu_fpa10,
  1725. fpu_fpa11:
  1726. begin
  1727. { save floating point registers? }
  1728. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1729. for r:=RS_F0 to RS_F7 do
  1730. if r in regs then
  1731. begin
  1732. if firstfloatreg=RS_NO then
  1733. firstfloatreg:=r;
  1734. lastfloatreg:=r;
  1735. inc(registerarea,12);
  1736. end;
  1737. end;
  1738. fpu_vfpv2,
  1739. fpu_vfpv3,
  1740. fpu_vfpv3_d16:
  1741. begin;
  1742. mmregs:=rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall);
  1743. end;
  1744. end;
  1745. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1746. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1747. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  1748. { save int registers }
  1749. reference_reset(ref,4);
  1750. ref.index:=NR_STACK_POINTER_REG;
  1751. ref.addressmode:=AM_PREINDEXED;
  1752. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  1753. if not(target_info.system in systems_darwin) then
  1754. begin
  1755. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1756. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1757. begin
  1758. a_reg_alloc(list,NR_R12);
  1759. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  1760. end;
  1761. { the (old) ARM APCS requires saving both the stack pointer (to
  1762. crawl the stack) and the PC (to identify the function this
  1763. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  1764. and R15 -- still needs updating for EABI and Darwin, they don't
  1765. need that }
  1766. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1767. regs:=regs+[RS_FRAME_POINTER_REG,RS_R12,RS_R14,RS_R15]
  1768. else
  1769. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1770. include(regs,RS_R14);
  1771. if regs<>[] then
  1772. begin
  1773. for r:=RS_R0 to RS_R15 do
  1774. if r in regs then
  1775. inc(registerarea,4);
  1776. { if the stack is not 8 byte aligned, try to add an extra register,
  1777. so we can avoid the extra sub/add ...,#4 later (KB) }
  1778. if ((registerarea mod current_settings.alignment.localalignmax) <> 0) then
  1779. for r:=RS_R3 downto RS_R0 do
  1780. if not(r in regs) then
  1781. begin
  1782. regs:=regs+[r];
  1783. inc(registerarea,4);
  1784. tarmprocinfo(current_procinfo).stackpaddingreg:=r;
  1785. break;
  1786. end;
  1787. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  1788. end;
  1789. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1790. begin
  1791. { the framepointer now points to the saved R15, so the saved
  1792. framepointer is at R11-12 (for get_caller_frame) }
  1793. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  1794. a_reg_dealloc(list,NR_R12);
  1795. end;
  1796. end
  1797. else
  1798. begin
  1799. { always save r14 if we use r7 as the framepointer, because
  1800. the parameter offsets are hardcoded in advance and always
  1801. assume that r14 sits on the stack right behind the saved r7
  1802. }
  1803. if current_procinfo.framepointer=NR_FRAME_POINTER_REG then
  1804. include(regs,RS_FRAME_POINTER_REG);
  1805. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1806. include(regs,RS_R14);
  1807. if regs<>[] then
  1808. begin
  1809. { on Darwin, you first have to save [r4-r7,lr], and then
  1810. [r8,r10,r11] and make r7 point to the previously saved
  1811. r7 so that you can perform a stack crawl based on it
  1812. ([r7] is previous stack frame, [r7+4] is return address
  1813. }
  1814. include(regs,RS_FRAME_POINTER_REG);
  1815. saveregs:=regs-[RS_R8,RS_R10,RS_R11];
  1816. r7offset:=0;
  1817. for r:=RS_R0 to RS_R15 do
  1818. if r in saveregs then
  1819. begin
  1820. inc(registerarea,4);
  1821. if r<RS_FRAME_POINTER_REG then
  1822. inc(r7offset,4);
  1823. end;
  1824. { save the registers }
  1825. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1826. { make r7 point to the saved r7 (regardless of whether this
  1827. frame uses the framepointer, for backtrace purposes) }
  1828. if r7offset<>0 then
  1829. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_FRAME_POINTER_REG,NR_R13,r7offset))
  1830. else
  1831. list.concat(taicpu.op_reg_reg(A_MOV,NR_R7,NR_R13));
  1832. { now save the rest (if any) }
  1833. saveregs:=regs-saveregs;
  1834. if saveregs<>[] then
  1835. begin
  1836. for r:=RS_R8 to RS_R11 do
  1837. if r in saveregs then
  1838. inc(registerarea,4);
  1839. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1840. end;
  1841. end;
  1842. end;
  1843. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  1844. if (LocalSize<>0) or
  1845. ((stackmisalignment<>0) and
  1846. ((pi_do_call in current_procinfo.flags) or
  1847. (po_assembler in current_procinfo.procdef.procoptions))) then
  1848. begin
  1849. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  1850. if stack_parameters and (pi_estimatestacksize in current_procinfo.flags) then
  1851. begin
  1852. if localsize>tarmprocinfo(current_procinfo).stackframesize then
  1853. internalerror(2014030901)
  1854. else
  1855. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea;
  1856. end;
  1857. if is_shifter_const(localsize,shift) then
  1858. begin
  1859. a_reg_dealloc(list,NR_R12);
  1860. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  1861. end
  1862. else if split_into_shifter_const(localsize, imm1, imm2) then
  1863. begin
  1864. a_reg_dealloc(list,NR_R12);
  1865. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  1866. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  1867. end
  1868. else
  1869. begin
  1870. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  1871. a_reg_alloc(list,NR_R12);
  1872. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  1873. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  1874. a_reg_dealloc(list,NR_R12);
  1875. end;
  1876. end;
  1877. if (mmregs<>[]) or
  1878. (firstfloatreg<>RS_NO) then
  1879. begin
  1880. reference_reset(ref,4);
  1881. if (tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023) or
  1882. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv3_d16]) then
  1883. begin
  1884. if not is_shifter_const(tarmprocinfo(current_procinfo).floatregstart,shift) then
  1885. begin
  1886. a_reg_alloc(list,NR_R12);
  1887. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  1888. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1889. a_reg_dealloc(list,NR_R12);
  1890. end
  1891. else
  1892. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tarmprocinfo(current_procinfo).floatregstart));
  1893. ref.base:=NR_R12;
  1894. end
  1895. else
  1896. begin
  1897. ref.base:=current_procinfo.framepointer;
  1898. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  1899. end;
  1900. case current_settings.fputype of
  1901. fpu_fpa,
  1902. fpu_fpa10,
  1903. fpu_fpa11:
  1904. begin
  1905. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  1906. lastfloatreg-firstfloatreg+1,ref));
  1907. end;
  1908. fpu_vfpv2,
  1909. fpu_vfpv3,
  1910. fpu_vfpv3_d16:
  1911. begin
  1912. ref.index:=ref.base;
  1913. ref.base:=NR_NO;
  1914. { FSTMX is deprecated on ARMv6 and later }
  1915. {if (current_settings.cputype<cpu_armv6) then
  1916. postfix:=PF_IAX
  1917. else
  1918. postfix:=PF_IAD;}
  1919. list.concat(taicpu.op_ref_regset(A_VSTM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  1920. end;
  1921. end;
  1922. end;
  1923. end;
  1924. end;
  1925. procedure tbasecgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  1926. var
  1927. ref : treference;
  1928. LocalSize : longint;
  1929. firstfloatreg,lastfloatreg,
  1930. r,
  1931. shift : byte;
  1932. mmregs,
  1933. saveregs,
  1934. regs : tcpuregisterset;
  1935. registerarea,
  1936. stackmisalignment: pint;
  1937. paddingreg: TSuperRegister;
  1938. mmpostfix: toppostfix;
  1939. imm1, imm2: DWord;
  1940. begin
  1941. if not(nostackframe) then
  1942. begin
  1943. registerarea:=0;
  1944. firstfloatreg:=RS_NO;
  1945. lastfloatreg:=RS_NO;
  1946. mmregs:=[];
  1947. saveregs:=[];
  1948. case current_settings.fputype of
  1949. fpu_fpa,
  1950. fpu_fpa10,
  1951. fpu_fpa11:
  1952. begin
  1953. { restore floating point registers? }
  1954. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1955. for r:=RS_F0 to RS_F7 do
  1956. if r in regs then
  1957. begin
  1958. if firstfloatreg=RS_NO then
  1959. firstfloatreg:=r;
  1960. lastfloatreg:=r;
  1961. { floating point register space is already included in
  1962. localsize below by calc_stackframe_size
  1963. inc(registerarea,12);
  1964. }
  1965. end;
  1966. end;
  1967. fpu_vfpv2,
  1968. fpu_vfpv3,
  1969. fpu_vfpv3_d16:
  1970. begin;
  1971. { restore vfp registers? }
  1972. mmregs:=rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall);
  1973. end;
  1974. end;
  1975. if (firstfloatreg<>RS_NO) or
  1976. (mmregs<>[]) then
  1977. begin
  1978. reference_reset(ref,4);
  1979. if (tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023) or
  1980. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv3_d16]) then
  1981. begin
  1982. if not is_shifter_const(tarmprocinfo(current_procinfo).floatregstart,shift) then
  1983. begin
  1984. a_reg_alloc(list,NR_R12);
  1985. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  1986. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1987. a_reg_dealloc(list,NR_R12);
  1988. end
  1989. else
  1990. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tarmprocinfo(current_procinfo).floatregstart));
  1991. ref.base:=NR_R12;
  1992. end
  1993. else
  1994. begin
  1995. ref.base:=current_procinfo.framepointer;
  1996. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  1997. end;
  1998. case current_settings.fputype of
  1999. fpu_fpa,
  2000. fpu_fpa10,
  2001. fpu_fpa11:
  2002. begin
  2003. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  2004. lastfloatreg-firstfloatreg+1,ref));
  2005. end;
  2006. fpu_vfpv2,
  2007. fpu_vfpv3,
  2008. fpu_vfpv3_d16:
  2009. begin
  2010. ref.index:=ref.base;
  2011. ref.base:=NR_NO;
  2012. { FLDMX is deprecated on ARMv6 and later }
  2013. {if (current_settings.cputype<cpu_armv6) then
  2014. mmpostfix:=PF_IAX
  2015. else
  2016. mmpostfix:=PF_IAD;}
  2017. list.concat(taicpu.op_ref_regset(A_VLDM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  2018. end;
  2019. end;
  2020. end;
  2021. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  2022. if (pi_do_call in current_procinfo.flags) or
  2023. (regs<>[]) or
  2024. ((target_info.system in systems_darwin) and
  2025. (current_procinfo.framepointer<>NR_STACK_POINTER_REG)) then
  2026. begin
  2027. exclude(regs,RS_R14);
  2028. include(regs,RS_R15);
  2029. if (target_info.system in systems_darwin) then
  2030. include(regs,RS_FRAME_POINTER_REG);
  2031. end;
  2032. if not(target_info.system in systems_darwin) then
  2033. begin
  2034. { restore saved stack pointer to SP (R13) and saved lr to PC (R15).
  2035. The saved PC came after that but is discarded, since we restore
  2036. the stack pointer }
  2037. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  2038. regs:=regs+[RS_FRAME_POINTER_REG,RS_R13,RS_R15];
  2039. end
  2040. else
  2041. begin
  2042. { restore R8-R11 already if necessary (they've been stored
  2043. before the others) }
  2044. saveregs:=regs*[RS_R8,RS_R10,RS_R11];
  2045. if saveregs<>[] then
  2046. begin
  2047. reference_reset(ref,4);
  2048. ref.index:=NR_STACK_POINTER_REG;
  2049. ref.addressmode:=AM_PREINDEXED;
  2050. for r:=RS_R8 to RS_R11 do
  2051. if r in saveregs then
  2052. inc(registerarea,4);
  2053. regs:=regs-saveregs;
  2054. end;
  2055. end;
  2056. for r:=RS_R0 to RS_R15 do
  2057. if r in regs then
  2058. inc(registerarea,4);
  2059. { reapply the stack padding reg, in case there was one, see the complimentary
  2060. comment in g_proc_entry() (KB) }
  2061. paddingreg:=tarmprocinfo(current_procinfo).stackpaddingreg;
  2062. if paddingreg < RS_R4 then
  2063. if paddingreg in regs then
  2064. internalerror(201306190)
  2065. else
  2066. begin
  2067. regs:=regs+[paddingreg];
  2068. inc(registerarea,4);
  2069. end;
  2070. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  2071. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  2072. (target_info.system in systems_darwin) then
  2073. begin
  2074. LocalSize:=current_procinfo.calc_stackframe_size;
  2075. if (LocalSize<>0) or
  2076. ((stackmisalignment<>0) and
  2077. ((pi_do_call in current_procinfo.flags) or
  2078. (po_assembler in current_procinfo.procdef.procoptions))) then
  2079. begin
  2080. if pi_estimatestacksize in current_procinfo.flags then
  2081. LocalSize:=tarmprocinfo(current_procinfo).stackframesize-registerarea
  2082. else
  2083. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  2084. if is_shifter_const(LocalSize,shift) then
  2085. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  2086. else if split_into_shifter_const(localsize, imm1, imm2) then
  2087. begin
  2088. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  2089. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  2090. end
  2091. else
  2092. begin
  2093. a_reg_alloc(list,NR_R12);
  2094. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  2095. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  2096. a_reg_dealloc(list,NR_R12);
  2097. end;
  2098. end;
  2099. if (target_info.system in systems_darwin) and
  2100. (saveregs<>[]) then
  2101. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  2102. if regs=[] then
  2103. begin
  2104. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2105. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2106. else
  2107. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2108. end
  2109. else
  2110. begin
  2111. reference_reset(ref,4);
  2112. ref.index:=NR_STACK_POINTER_REG;
  2113. ref.addressmode:=AM_PREINDEXED;
  2114. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  2115. end;
  2116. end
  2117. else
  2118. begin
  2119. { restore int registers and return }
  2120. reference_reset(ref,4);
  2121. ref.index:=NR_FRAME_POINTER_REG;
  2122. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_EA));
  2123. end;
  2124. end
  2125. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2126. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2127. else
  2128. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2129. end;
  2130. procedure tbasecgarm.g_maybe_got_init(list : TAsmList);
  2131. var
  2132. ref : treference;
  2133. l : TAsmLabel;
  2134. begin
  2135. if (cs_create_pic in current_settings.moduleswitches) and
  2136. (pi_needs_got in current_procinfo.flags) and
  2137. (tf_pic_uses_got in target_info.flags) then
  2138. begin
  2139. reference_reset(ref,4);
  2140. current_asmdata.getglobaldatalabel(l);
  2141. cg.a_label(current_procinfo.aktlocaldata,l);
  2142. ref.symbol:=l;
  2143. ref.base:=NR_PC;
  2144. ref.symboldata:=current_procinfo.aktlocaldata.last;
  2145. list.concat(Taicpu.op_reg_ref(A_LDR,current_procinfo.got,ref));
  2146. current_asmdata.getaddrlabel(l);
  2147. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_32bit,l,current_asmdata.RefAsmSymbol('_GLOBAL_OFFSET_TABLE_'),-8));
  2148. cg.a_label(list,l);
  2149. list.concat(Taicpu.op_reg_reg_reg(A_ADD,current_procinfo.got,NR_PC,current_procinfo.got));
  2150. end;
  2151. end;
  2152. procedure tbasecgarm.a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);
  2153. var
  2154. b : byte;
  2155. tmpref : treference;
  2156. instr : taicpu;
  2157. begin
  2158. if ref.addressmode<>AM_OFFSET then
  2159. internalerror(200309071);
  2160. tmpref:=ref;
  2161. { Be sure to have a base register }
  2162. if (tmpref.base=NR_NO) then
  2163. begin
  2164. if tmpref.shiftmode<>SM_None then
  2165. internalerror(2014020702);
  2166. if tmpref.signindex<0 then
  2167. internalerror(200312023);
  2168. tmpref.base:=tmpref.index;
  2169. tmpref.index:=NR_NO;
  2170. end;
  2171. if assigned(tmpref.symbol) or
  2172. not((is_shifter_const(tmpref.offset,b)) or
  2173. (is_shifter_const(-tmpref.offset,b))
  2174. ) then
  2175. fixref(list,tmpref);
  2176. { expect a base here if there is an index }
  2177. if (tmpref.base=NR_NO) and (tmpref.index<>NR_NO) then
  2178. internalerror(200312022);
  2179. if tmpref.index<>NR_NO then
  2180. begin
  2181. if tmpref.shiftmode<>SM_None then
  2182. internalerror(200312021);
  2183. if tmpref.signindex<0 then
  2184. a_op_reg_reg_reg(list,OP_SUB,OS_ADDR,tmpref.base,tmpref.index,r)
  2185. else
  2186. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpref.base,tmpref.index,r);
  2187. if tmpref.offset<>0 then
  2188. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,r,r);
  2189. end
  2190. else
  2191. begin
  2192. if tmpref.base=NR_NO then
  2193. a_load_const_reg(list,OS_ADDR,tmpref.offset,r)
  2194. else
  2195. if tmpref.offset<>0 then
  2196. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,tmpref.base,r)
  2197. else
  2198. begin
  2199. instr:=taicpu.op_reg_reg(A_MOV,r,tmpref.base);
  2200. list.concat(instr);
  2201. add_move_instruction(instr);
  2202. end;
  2203. end;
  2204. end;
  2205. procedure tbasecgarm.fixref(list : TAsmList;var ref : treference);
  2206. var
  2207. tmpreg, tmpreg2 : tregister;
  2208. tmpref : treference;
  2209. l, piclabel : tasmlabel;
  2210. indirection_done : boolean;
  2211. begin
  2212. { absolute symbols can't be handled directly, we've to store the symbol reference
  2213. in the text segment and access it pc relative
  2214. For now, we assume that references where base or index equals to PC are already
  2215. relative, all other references are assumed to be absolute and thus they need
  2216. to be handled extra.
  2217. A proper solution would be to change refoptions to a set and store the information
  2218. if the symbol is absolute or relative there.
  2219. }
  2220. { create consts entry }
  2221. reference_reset(tmpref,4);
  2222. current_asmdata.getjumplabel(l);
  2223. cg.a_label(current_procinfo.aktlocaldata,l);
  2224. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  2225. piclabel:=nil;
  2226. tmpreg:=NR_NO;
  2227. indirection_done:=false;
  2228. if assigned(ref.symbol) then
  2229. begin
  2230. if (target_info.system=system_arm_darwin) and
  2231. (ref.symbol.bind in [AB_EXTERNAL,AB_WEAK_EXTERNAL,AB_PRIVATE_EXTERN,AB_COMMON]) then
  2232. begin
  2233. tmpreg:=g_indirect_sym_load(list,ref.symbol.name,asmsym2indsymflags(ref.symbol));
  2234. if ref.offset<>0 then
  2235. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2236. indirection_done:=true;
  2237. end
  2238. else if (cs_create_pic in current_settings.moduleswitches) then
  2239. if (tf_pic_uses_got in target_info.flags) then
  2240. current_procinfo.aktlocaldata.concat(tai_const.Create_type_sym_offset(aitconst_got,ref.symbol,ref.offset))
  2241. else
  2242. begin
  2243. { ideally, we would want to generate
  2244. ldr r1, LPICConstPool
  2245. LPICLocal:
  2246. ldr/str r2,[pc,r1]
  2247. ...
  2248. LPICConstPool:
  2249. .long _globsym-(LPICLocal+8)
  2250. However, we cannot be sure that the ldr/str will follow
  2251. right after the call to fixref, so we have to load the
  2252. complete address already in a register.
  2253. }
  2254. current_asmdata.getaddrlabel(piclabel);
  2255. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_ptr,piclabel,ref.symbol,ref.offset-8));
  2256. end
  2257. else
  2258. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset))
  2259. end
  2260. else
  2261. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ref.offset));
  2262. { load consts entry }
  2263. if not indirection_done then
  2264. begin
  2265. tmpreg:=getintregister(list,OS_INT);
  2266. tmpref.symbol:=l;
  2267. tmpref.base:=NR_PC;
  2268. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2269. if (cs_create_pic in current_settings.moduleswitches) and
  2270. (tf_pic_uses_got in target_info.flags) and
  2271. assigned(ref.symbol) then
  2272. begin
  2273. reference_reset(tmpref,4);
  2274. tmpref.base:=current_procinfo.got;
  2275. tmpref.index:=tmpreg;
  2276. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2277. end;
  2278. end;
  2279. if assigned(piclabel) then
  2280. begin
  2281. cg.a_label(list,piclabel);
  2282. tmpreg2:=getaddressregister(list);
  2283. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpreg,NR_PC,tmpreg2);
  2284. tmpreg:=tmpreg2
  2285. end;
  2286. { This routine can be called with PC as base/index in case the offset
  2287. was too large to encode in a load/store. In that case, the entire
  2288. absolute expression has been re-encoded in a new constpool entry, and
  2289. we have to remove the use of PC from the original reference (the code
  2290. above made everything relative to the value loaded from the new
  2291. constpool entry) }
  2292. if is_pc(ref.base) then
  2293. ref.base:=NR_NO;
  2294. if is_pc(ref.index) then
  2295. ref.index:=NR_NO;
  2296. if (ref.base<>NR_NO) then
  2297. begin
  2298. if ref.index<>NR_NO then
  2299. begin
  2300. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  2301. ref.base:=tmpreg;
  2302. end
  2303. else
  2304. if ref.base<>NR_PC then
  2305. begin
  2306. ref.index:=tmpreg;
  2307. ref.shiftimm:=0;
  2308. ref.signindex:=1;
  2309. ref.shiftmode:=SM_None;
  2310. end
  2311. else
  2312. ref.base:=tmpreg;
  2313. end
  2314. else
  2315. ref.base:=tmpreg;
  2316. ref.offset:=0;
  2317. ref.symbol:=nil;
  2318. end;
  2319. procedure tbasecgarm.g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  2320. var
  2321. paraloc1,paraloc2,paraloc3 : TCGPara;
  2322. pd : tprocdef;
  2323. begin
  2324. pd:=search_system_proc('MOVE');
  2325. paraloc1.init;
  2326. paraloc2.init;
  2327. paraloc3.init;
  2328. paramanager.getintparaloc(list,pd,1,paraloc1);
  2329. paramanager.getintparaloc(list,pd,2,paraloc2);
  2330. paramanager.getintparaloc(list,pd,3,paraloc3);
  2331. a_load_const_cgpara(list,OS_SINT,len,paraloc3);
  2332. a_loadaddr_ref_cgpara(list,dest,paraloc2);
  2333. a_loadaddr_ref_cgpara(list,source,paraloc1);
  2334. paramanager.freecgpara(list,paraloc3);
  2335. paramanager.freecgpara(list,paraloc2);
  2336. paramanager.freecgpara(list,paraloc1);
  2337. alloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2338. alloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2339. a_call_name(list,'FPC_MOVE',false);
  2340. dealloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2341. dealloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2342. paraloc3.done;
  2343. paraloc2.done;
  2344. paraloc1.done;
  2345. end;
  2346. procedure tbasecgarm.g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  2347. const
  2348. maxtmpreg_arm = 10; {roozbeh: can be reduced to 8 or lower if might conflick with reserved ones,also +2 is used becouse of regs required for referencing}
  2349. maxtmpreg_thumb = 5;
  2350. var
  2351. srcref,dstref,usedtmpref,usedtmpref2:treference;
  2352. srcreg,destreg,countreg,r,tmpreg:tregister;
  2353. helpsize:aint;
  2354. copysize:byte;
  2355. cgsize:Tcgsize;
  2356. tmpregisters:array[1..maxtmpreg_arm] of tregister;
  2357. maxtmpreg,
  2358. tmpregi,tmpregi2:byte;
  2359. { will never be called with count<=4 }
  2360. procedure genloop(count : aword;size : byte);
  2361. const
  2362. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2363. var
  2364. l : tasmlabel;
  2365. begin
  2366. current_asmdata.getjumplabel(l);
  2367. if count<size then size:=1;
  2368. a_load_const_reg(list,OS_INT,count div size,countreg);
  2369. cg.a_label(list,l);
  2370. srcref.addressmode:=AM_POSTINDEXED;
  2371. dstref.addressmode:=AM_POSTINDEXED;
  2372. srcref.offset:=size;
  2373. dstref.offset:=size;
  2374. r:=getintregister(list,size2opsize[size]);
  2375. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2376. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2377. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1),PF_S));
  2378. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2379. a_jmp_flags(list,F_NE,l);
  2380. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2381. srcref.offset:=1;
  2382. dstref.offset:=1;
  2383. case count mod size of
  2384. 1:
  2385. begin
  2386. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2387. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2388. end;
  2389. 2:
  2390. if aligned then
  2391. begin
  2392. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2393. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2394. end
  2395. else
  2396. begin
  2397. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2398. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2399. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2400. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2401. end;
  2402. 3:
  2403. if aligned then
  2404. begin
  2405. srcref.offset:=2;
  2406. dstref.offset:=2;
  2407. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2408. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2409. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2410. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2411. end
  2412. else
  2413. begin
  2414. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2415. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2416. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2417. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2418. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2419. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2420. end;
  2421. end;
  2422. { keep the registers alive }
  2423. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2424. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2425. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2426. end;
  2427. { will never be called with count<=4 }
  2428. procedure genloop_thumb(count : aword;size : byte);
  2429. procedure refincofs(const ref : treference;const value : longint = 1);
  2430. begin
  2431. a_op_const_reg(list,OP_ADD,OS_ADDR,value,ref.base);
  2432. end;
  2433. const
  2434. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2435. var
  2436. l : tasmlabel;
  2437. begin
  2438. current_asmdata.getjumplabel(l);
  2439. if count<size then size:=1;
  2440. a_load_const_reg(list,OS_INT,count div size,countreg);
  2441. cg.a_label(list,l);
  2442. r:=getintregister(list,size2opsize[size]);
  2443. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2444. refincofs(srcref);
  2445. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2446. refincofs(dstref);
  2447. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2448. list.concat(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1));
  2449. a_jmp_flags(list,F_NE,l);
  2450. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2451. case count mod size of
  2452. 1:
  2453. begin
  2454. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2455. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2456. end;
  2457. 2:
  2458. if aligned then
  2459. begin
  2460. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2461. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2462. end
  2463. else
  2464. begin
  2465. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2466. refincofs(srcref);
  2467. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2468. refincofs(dstref);
  2469. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2470. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2471. end;
  2472. 3:
  2473. if aligned then
  2474. begin
  2475. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2476. refincofs(srcref,2);
  2477. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2478. refincofs(dstref,2);
  2479. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2480. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2481. end
  2482. else
  2483. begin
  2484. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2485. refincofs(srcref);
  2486. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2487. refincofs(dstref);
  2488. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2489. refincofs(srcref);
  2490. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2491. refincofs(dstref);
  2492. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2493. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2494. end;
  2495. end;
  2496. { keep the registers alive }
  2497. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2498. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2499. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2500. end;
  2501. begin
  2502. if len=0 then
  2503. exit;
  2504. if GenerateThumbCode then
  2505. maxtmpreg:=maxtmpreg_thumb
  2506. else
  2507. maxtmpreg:=maxtmpreg_arm;
  2508. helpsize:=12+maxtmpreg*4;//52 with maxtmpreg=10
  2509. dstref:=dest;
  2510. srcref:=source;
  2511. if cs_opt_size in current_settings.optimizerswitches then
  2512. helpsize:=8;
  2513. if aligned and (len=4) then
  2514. begin
  2515. tmpreg:=getintregister(list,OS_32);
  2516. a_load_ref_reg(list,OS_32,OS_32,source,tmpreg);
  2517. a_load_reg_ref(list,OS_32,OS_32,tmpreg,dest);
  2518. end
  2519. else if aligned and (len=2) then
  2520. begin
  2521. tmpreg:=getintregister(list,OS_16);
  2522. a_load_ref_reg(list,OS_16,OS_16,source,tmpreg);
  2523. a_load_reg_ref(list,OS_16,OS_16,tmpreg,dest);
  2524. end
  2525. else if (len<=helpsize) and aligned then
  2526. begin
  2527. tmpregi:=0;
  2528. srcreg:=getintregister(list,OS_ADDR);
  2529. { explicit pc relative addressing, could be
  2530. e.g. a floating point constant }
  2531. if source.base=NR_PC then
  2532. begin
  2533. { ... then we don't need a loadaddr }
  2534. srcref:=source;
  2535. end
  2536. else
  2537. begin
  2538. a_loadaddr_ref_reg(list,source,srcreg);
  2539. reference_reset_base(srcref,srcreg,0,source.alignment);
  2540. end;
  2541. while (len div 4 <> 0) and (tmpregi<maxtmpreg) do
  2542. begin
  2543. inc(tmpregi);
  2544. tmpregisters[tmpregi]:=getintregister(list,OS_32);
  2545. a_load_ref_reg(list,OS_32,OS_32,srcref,tmpregisters[tmpregi]);
  2546. inc(srcref.offset,4);
  2547. dec(len,4);
  2548. end;
  2549. destreg:=getintregister(list,OS_ADDR);
  2550. a_loadaddr_ref_reg(list,dest,destreg);
  2551. reference_reset_base(dstref,destreg,0,dest.alignment);
  2552. tmpregi2:=1;
  2553. while (tmpregi2<=tmpregi) do
  2554. begin
  2555. a_load_reg_ref(list,OS_32,OS_32,tmpregisters[tmpregi2],dstref);
  2556. inc(dstref.offset,4);
  2557. inc(tmpregi2);
  2558. end;
  2559. copysize:=4;
  2560. cgsize:=OS_32;
  2561. while len<>0 do
  2562. begin
  2563. if len<2 then
  2564. begin
  2565. copysize:=1;
  2566. cgsize:=OS_8;
  2567. end
  2568. else if len<4 then
  2569. begin
  2570. copysize:=2;
  2571. cgsize:=OS_16;
  2572. end;
  2573. dec(len,copysize);
  2574. r:=getintregister(list,cgsize);
  2575. a_load_ref_reg(list,cgsize,cgsize,srcref,r);
  2576. a_load_reg_ref(list,cgsize,cgsize,r,dstref);
  2577. inc(srcref.offset,copysize);
  2578. inc(dstref.offset,copysize);
  2579. end;{end of while}
  2580. end
  2581. else
  2582. begin
  2583. cgsize:=OS_32;
  2584. if (len<=4) then{len<=4 and not aligned}
  2585. begin
  2586. r:=getintregister(list,cgsize);
  2587. usedtmpref:=a_internal_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2588. if Len=1 then
  2589. a_load_reg_ref(list,OS_8,OS_8,r,dstref)
  2590. else
  2591. begin
  2592. tmpreg:=getintregister(list,cgsize);
  2593. usedtmpref2:=a_internal_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2594. inc(usedtmpref.offset,1);
  2595. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2596. inc(usedtmpref2.offset,1);
  2597. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2598. if len>2 then
  2599. begin
  2600. inc(usedtmpref.offset,1);
  2601. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2602. inc(usedtmpref2.offset,1);
  2603. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2604. if len>3 then
  2605. begin
  2606. inc(usedtmpref.offset,1);
  2607. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2608. inc(usedtmpref2.offset,1);
  2609. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2610. end;
  2611. end;
  2612. end;
  2613. end{end of if len<=4}
  2614. else
  2615. begin{unaligned & 4<len<helpsize **or** aligned/unaligned & len>helpsize}
  2616. destreg:=getintregister(list,OS_ADDR);
  2617. a_loadaddr_ref_reg(list,dest,destreg);
  2618. reference_reset_base(dstref,destreg,0,dest.alignment);
  2619. srcreg:=getintregister(list,OS_ADDR);
  2620. a_loadaddr_ref_reg(list,source,srcreg);
  2621. reference_reset_base(srcref,srcreg,0,source.alignment);
  2622. countreg:=getintregister(list,OS_32);
  2623. // if cs_opt_size in current_settings.optimizerswitches then
  2624. { roozbeh : it seems loading 1 byte is faster becouse of caching/fetching(?) }
  2625. {if aligned then
  2626. genloop(len,4)
  2627. else}
  2628. if GenerateThumbCode then
  2629. genloop_thumb(len,1)
  2630. else
  2631. genloop(len,1);
  2632. end;
  2633. end;
  2634. end;
  2635. procedure tbasecgarm.g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);
  2636. begin
  2637. g_concatcopy_internal(list,source,dest,len,false);
  2638. end;
  2639. procedure tbasecgarm.g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);
  2640. begin
  2641. if (source.alignment in [1,3]) or
  2642. (dest.alignment in [1,3]) then
  2643. g_concatcopy_internal(list,source,dest,len,false)
  2644. else
  2645. g_concatcopy_internal(list,source,dest,len,true);
  2646. end;
  2647. procedure tbasecgarm.g_overflowCheck(list : TAsmList;const l : tlocation;def : tdef);
  2648. var
  2649. ovloc : tlocation;
  2650. begin
  2651. ovloc.loc:=LOC_VOID;
  2652. g_overflowCheck_loc(list,l,def,ovloc);
  2653. end;
  2654. procedure tbasecgarm.g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);
  2655. var
  2656. hl : tasmlabel;
  2657. ai:TAiCpu;
  2658. hflags : tresflags;
  2659. begin
  2660. if not(cs_check_overflow in current_settings.localswitches) then
  2661. exit;
  2662. current_asmdata.getjumplabel(hl);
  2663. case ovloc.loc of
  2664. LOC_VOID:
  2665. begin
  2666. ai:=taicpu.op_sym(A_B,hl);
  2667. ai.is_jmp:=true;
  2668. if not((def.typ=pointerdef) or
  2669. ((def.typ=orddef) and
  2670. (torddef(def).ordtype in [u64bit,u16bit,u32bit,u8bit,uchar,
  2671. pasbool8,pasbool16,pasbool32,pasbool64]))) then
  2672. ai.SetCondition(C_VC)
  2673. else
  2674. if TAiCpu(List.Last).opcode in [A_RSB,A_RSC,A_SBC,A_SUB] then
  2675. ai.SetCondition(C_CS)
  2676. else
  2677. ai.SetCondition(C_CC);
  2678. list.concat(ai);
  2679. end;
  2680. LOC_FLAGS:
  2681. begin
  2682. hflags:=ovloc.resflags;
  2683. inverse_flags(hflags);
  2684. cg.a_jmp_flags(list,hflags,hl);
  2685. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2686. end;
  2687. else
  2688. internalerror(200409281);
  2689. end;
  2690. a_call_name(list,'FPC_OVERFLOW',false);
  2691. a_label(list,hl);
  2692. end;
  2693. procedure tbasecgarm.g_save_registers(list : TAsmList);
  2694. begin
  2695. { this work is done in g_proc_entry }
  2696. end;
  2697. procedure tbasecgarm.g_restore_registers(list : TAsmList);
  2698. begin
  2699. { this work is done in g_proc_exit }
  2700. end;
  2701. procedure tbasecgarm.a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  2702. var
  2703. ai : taicpu;
  2704. hlabel : TAsmLabel;
  2705. begin
  2706. if GenerateThumbCode then
  2707. begin
  2708. { the optimizer has to fix this if jump range is sufficient short }
  2709. current_asmdata.getjumplabel(hlabel);
  2710. ai:=Taicpu.Op_sym(A_B,hlabel);
  2711. ai.SetCondition(inverse_cond(OpCmp2AsmCond[cond]));
  2712. ai.is_jmp:=true;
  2713. list.concat(ai);
  2714. a_jmp_always(list,l);
  2715. a_label(list,hlabel);
  2716. end
  2717. else
  2718. begin
  2719. ai:=Taicpu.Op_sym(A_B,l);
  2720. ai.SetCondition(OpCmp2AsmCond[cond]);
  2721. ai.is_jmp:=true;
  2722. list.concat(ai);
  2723. end;
  2724. end;
  2725. function get_scalar_mm_op(fromsize,tosize : tcgsize) : tasmop;
  2726. const
  2727. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of tasmop = (
  2728. (A_VMOV,A_VCVT,A_NONE,A_NONE,A_NONE),
  2729. (A_VCVT,A_VMOV,A_NONE,A_NONE,A_NONE),
  2730. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2731. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2732. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE));
  2733. begin
  2734. result:=convertop[fromsize,tosize];
  2735. if result=A_NONE then
  2736. internalerror(200312205);
  2737. end;
  2738. function get_scalar_mm_prefix(fromsize,tosize : tcgsize) : TOpPostfix;
  2739. const
  2740. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of TOpPostfix = (
  2741. (PF_F32, PF_F32F64,PF_None,PF_None,PF_None),
  2742. (PF_F64F32,PF_F64, PF_None,PF_None,PF_None),
  2743. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2744. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2745. (PF_None, PF_None, PF_None,PF_None,PF_None));
  2746. begin
  2747. result:=convertop[fromsize,tosize];
  2748. end;
  2749. procedure tbasecgarm.a_loadmm_reg_reg(list: tasmlist; fromsize,tosize: tcgsize; reg1,reg2: tregister; shuffle: pmmshuffle);
  2750. var
  2751. instr: taicpu;
  2752. begin
  2753. if (shuffle=nil) or shufflescalar(shuffle) then
  2754. instr:=setoppostfix(taicpu.op_reg_reg(get_scalar_mm_op(tosize,fromsize),reg2,reg1),get_scalar_mm_prefix(tosize,fromsize))
  2755. else
  2756. internalerror(2009112407);
  2757. list.concat(instr);
  2758. case instr.opcode of
  2759. A_VMOV:
  2760. add_move_instruction(instr);
  2761. end;
  2762. end;
  2763. procedure tbasecgarm.a_loadmm_ref_reg(list: tasmlist; fromsize,tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  2764. var
  2765. intreg,
  2766. tmpmmreg : tregister;
  2767. reg64 : tregister64;
  2768. begin
  2769. if assigned(shuffle) and
  2770. not(shufflescalar(shuffle)) then
  2771. internalerror(2009112413);
  2772. case fromsize of
  2773. OS_32,OS_S32:
  2774. begin
  2775. fromsize:=OS_F32;
  2776. { since we are loading an integer, no conversion may be required }
  2777. if (fromsize<>tosize) then
  2778. internalerror(2009112801);
  2779. end;
  2780. OS_64,OS_S64:
  2781. begin
  2782. fromsize:=OS_F64;
  2783. { since we are loading an integer, no conversion may be required }
  2784. if (fromsize<>tosize) then
  2785. internalerror(2009112901);
  2786. end;
  2787. end;
  2788. if (fromsize<>tosize) then
  2789. tmpmmreg:=getmmregister(list,fromsize)
  2790. else
  2791. tmpmmreg:=reg;
  2792. if (ref.alignment in [1,2]) then
  2793. begin
  2794. case fromsize of
  2795. OS_F32:
  2796. begin
  2797. intreg:=getintregister(list,OS_32);
  2798. a_load_ref_reg(list,OS_32,OS_32,ref,intreg);
  2799. a_loadmm_intreg_reg(list,OS_32,OS_F32,intreg,tmpmmreg,mms_movescalar);
  2800. end;
  2801. OS_F64:
  2802. begin
  2803. reg64.reglo:=getintregister(list,OS_32);
  2804. reg64.reghi:=getintregister(list,OS_32);
  2805. cg64.a_load64_ref_reg(list,ref,reg64);
  2806. cg64.a_loadmm_intreg64_reg(list,OS_F64,reg64,tmpmmreg);
  2807. end;
  2808. else
  2809. internalerror(2009112412);
  2810. end;
  2811. end
  2812. else
  2813. begin
  2814. handle_load_store(list,A_VLDR,PF_None,tmpmmreg,ref);
  2815. end;
  2816. if (tmpmmreg<>reg) then
  2817. a_loadmm_reg_reg(list,fromsize,tosize,tmpmmreg,reg,shuffle);
  2818. end;
  2819. procedure tbasecgarm.a_loadmm_reg_ref(list: tasmlist; fromsize,tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  2820. var
  2821. intreg,
  2822. tmpmmreg : tregister;
  2823. reg64 : tregister64;
  2824. begin
  2825. if assigned(shuffle) and
  2826. not(shufflescalar(shuffle)) then
  2827. internalerror(2009112416);
  2828. case tosize of
  2829. OS_32,OS_S32:
  2830. begin
  2831. tosize:=OS_F32;
  2832. { since we are loading an integer, no conversion may be required }
  2833. if (fromsize<>tosize) then
  2834. internalerror(2009112801);
  2835. end;
  2836. OS_64,OS_S64:
  2837. begin
  2838. tosize:=OS_F64;
  2839. { since we are loading an integer, no conversion may be required }
  2840. if (fromsize<>tosize) then
  2841. internalerror(2009112901);
  2842. end;
  2843. end;
  2844. if (fromsize<>tosize) then
  2845. begin
  2846. tmpmmreg:=getmmregister(list,tosize);
  2847. a_loadmm_reg_reg(list,fromsize,tosize,reg,tmpmmreg,shuffle);
  2848. end
  2849. else
  2850. tmpmmreg:=reg;
  2851. if (ref.alignment in [1,2]) then
  2852. begin
  2853. case tosize of
  2854. OS_F32:
  2855. begin
  2856. intreg:=getintregister(list,OS_32);
  2857. a_loadmm_reg_intreg(list,OS_F32,OS_32,tmpmmreg,intreg,shuffle);
  2858. a_load_reg_ref(list,OS_32,OS_32,intreg,ref);
  2859. end;
  2860. OS_F64:
  2861. begin
  2862. reg64.reglo:=getintregister(list,OS_32);
  2863. reg64.reghi:=getintregister(list,OS_32);
  2864. cg64.a_loadmm_reg_intreg64(list,OS_F64,tmpmmreg,reg64);
  2865. cg64.a_load64_reg_ref(list,reg64,ref);
  2866. end;
  2867. else
  2868. internalerror(2009112417);
  2869. end;
  2870. end
  2871. else
  2872. begin
  2873. handle_load_store(list,A_VSTR,PF_None,tmpmmreg,ref);
  2874. end;
  2875. end;
  2876. procedure tbasecgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  2877. begin
  2878. { this code can only be used to transfer raw data, not to perform
  2879. conversions }
  2880. if (tosize<>OS_F32) then
  2881. internalerror(2009112419);
  2882. if not(fromsize in [OS_32,OS_S32]) then
  2883. internalerror(2009112420);
  2884. if assigned(shuffle) and
  2885. not shufflescalar(shuffle) then
  2886. internalerror(2009112516);
  2887. list.concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg));
  2888. end;
  2889. procedure tbasecgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize; mmreg, intreg: tregister;shuffle : pmmshuffle);
  2890. begin
  2891. { this code can only be used to transfer raw data, not to perform
  2892. conversions }
  2893. if (fromsize<>OS_F32) then
  2894. internalerror(2009112430);
  2895. if not(tosize in [OS_32,OS_S32]) then
  2896. internalerror(2009112420);
  2897. if assigned(shuffle) and
  2898. not shufflescalar(shuffle) then
  2899. internalerror(2009112514);
  2900. list.concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg));
  2901. end;
  2902. procedure tbasecgarm.a_opmm_reg_reg(list: tasmlist; op: topcg; size: tcgsize; src, dst: tregister; shuffle: pmmshuffle);
  2903. var
  2904. tmpreg: tregister;
  2905. begin
  2906. { the vfp doesn't support xor nor any other logical operation, but
  2907. this routine is used to initialise global mm regvars. We can
  2908. easily initialise an mm reg with 0 though. }
  2909. case op of
  2910. OP_XOR:
  2911. begin
  2912. if (src<>dst) or
  2913. (reg_cgsize(src)<>size) or
  2914. assigned(shuffle) then
  2915. internalerror(2009112907);
  2916. tmpreg:=getintregister(list,OS_32);
  2917. a_load_const_reg(list,OS_32,0,tmpreg);
  2918. case size of
  2919. OS_F32:
  2920. list.concat(taicpu.op_reg_reg(A_VMOV,dst,tmpreg));
  2921. OS_F64:
  2922. list.concat(taicpu.op_reg_reg_reg(A_VMOV,dst,tmpreg,tmpreg));
  2923. else
  2924. internalerror(2009112908);
  2925. end;
  2926. end
  2927. else
  2928. internalerror(2009112906);
  2929. end;
  2930. end;
  2931. procedure tbasecgarm.maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  2932. const
  2933. overflowops = [OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NEG];
  2934. begin
  2935. if (op in overflowops) and
  2936. (size in [OS_8,OS_S8,OS_16,OS_S16]) then
  2937. a_load_reg_reg(list,OS_32,size,dst,dst);
  2938. end;
  2939. procedure tbasecgarm.safe_mla(list : TAsmList; op1,op2,op3,op4 : TRegister);
  2940. procedure checkreg(var reg : TRegister);
  2941. var
  2942. tmpreg : TRegister;
  2943. begin
  2944. if ((GenerateThumbCode or GenerateThumb2Code) and (getsupreg(reg)=RS_R13)) or
  2945. (getsupreg(reg)=RS_R15) then
  2946. begin
  2947. tmpreg:=getintregister(list,OS_INT);
  2948. a_load_reg_reg(list,OS_INT,OS_INT,reg,tmpreg);
  2949. reg:=tmpreg;
  2950. end;
  2951. end;
  2952. begin
  2953. checkreg(op1);
  2954. checkreg(op2);
  2955. checkreg(op3);
  2956. checkreg(op4);
  2957. list.concat(taicpu.op_reg_reg_reg_reg(A_MLA,op1,op2,op3,op4));
  2958. end;
  2959. procedure tcg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  2960. begin
  2961. case op of
  2962. OP_NEG:
  2963. begin
  2964. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2965. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  2966. list.concat(taicpu.op_reg_reg_const(A_RSC,regdst.reghi,regsrc.reghi,0));
  2967. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2968. end;
  2969. OP_NOT:
  2970. begin
  2971. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  2972. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  2973. end;
  2974. else
  2975. a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);
  2976. end;
  2977. end;
  2978. procedure tcg64farm.a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);
  2979. begin
  2980. a_op64_const_reg_reg(list,op,size,value,reg,reg);
  2981. end;
  2982. procedure tcg64farm.a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);
  2983. var
  2984. ovloc : tlocation;
  2985. begin
  2986. a_op64_const_reg_reg_checkoverflow(list,op,size,value,regsrc,regdst,false,ovloc);
  2987. end;
  2988. procedure tcg64farm.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);
  2989. var
  2990. ovloc : tlocation;
  2991. begin
  2992. a_op64_reg_reg_reg_checkoverflow(list,op,size,regsrc1,regsrc2,regdst,false,ovloc);
  2993. end;
  2994. procedure tcg64farm.a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);
  2995. begin
  2996. { this code can only be used to transfer raw data, not to perform
  2997. conversions }
  2998. if (mmsize<>OS_F64) then
  2999. internalerror(2009112405);
  3000. list.concat(taicpu.op_reg_reg_reg(A_VMOV,mmreg,intreg.reglo,intreg.reghi));
  3001. end;
  3002. procedure tcg64farm.a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);
  3003. begin
  3004. { this code can only be used to transfer raw data, not to perform
  3005. conversions }
  3006. if (mmsize<>OS_F64) then
  3007. internalerror(2009112406);
  3008. list.concat(taicpu.op_reg_reg_reg(A_VMOV,intreg.reglo,intreg.reghi,mmreg));
  3009. end;
  3010. procedure tcg64farm.a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3011. var
  3012. tmpreg : tregister;
  3013. b : byte;
  3014. begin
  3015. ovloc.loc:=LOC_VOID;
  3016. case op of
  3017. OP_NEG,
  3018. OP_NOT :
  3019. internalerror(2012022501);
  3020. end;
  3021. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3022. begin
  3023. case op of
  3024. OP_ADD:
  3025. begin
  3026. if is_shifter_const(lo(value),b) then
  3027. begin
  3028. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3029. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3030. end
  3031. else
  3032. begin
  3033. tmpreg:=cg.getintregister(list,OS_32);
  3034. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3035. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3036. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3037. end;
  3038. if is_shifter_const(hi(value),b) then
  3039. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,hi(value)),PF_S))
  3040. else
  3041. begin
  3042. tmpreg:=cg.getintregister(list,OS_32);
  3043. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3044. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3045. end;
  3046. end;
  3047. OP_SUB:
  3048. begin
  3049. if is_shifter_const(lo(value),b) then
  3050. begin
  3051. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3052. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3053. end
  3054. else
  3055. begin
  3056. tmpreg:=cg.getintregister(list,OS_32);
  3057. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3058. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3059. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3060. end;
  3061. if is_shifter_const(hi(value),b) then
  3062. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))),PF_S))
  3063. else
  3064. begin
  3065. tmpreg:=cg.getintregister(list,OS_32);
  3066. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3067. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3068. end;
  3069. end;
  3070. else
  3071. internalerror(200502131);
  3072. end;
  3073. if size=OS_64 then
  3074. begin
  3075. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3076. ovloc.loc:=LOC_FLAGS;
  3077. case op of
  3078. OP_ADD:
  3079. ovloc.resflags:=F_CS;
  3080. OP_SUB:
  3081. ovloc.resflags:=F_CC;
  3082. end;
  3083. end;
  3084. end
  3085. else
  3086. begin
  3087. case op of
  3088. OP_AND,OP_OR,OP_XOR:
  3089. begin
  3090. cg.a_op_const_reg_reg(list,op,OS_32,aint(lo(value)),regsrc.reglo,regdst.reglo);
  3091. cg.a_op_const_reg_reg(list,op,OS_32,aint(hi(value)),regsrc.reghi,regdst.reghi);
  3092. end;
  3093. OP_ADD:
  3094. begin
  3095. if is_shifter_const(aint(lo(value)),b) then
  3096. begin
  3097. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3098. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3099. end
  3100. else
  3101. begin
  3102. tmpreg:=cg.getintregister(list,OS_32);
  3103. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3104. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3105. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3106. end;
  3107. if is_shifter_const(aint(hi(value)),b) then
  3108. list.concat(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3109. else
  3110. begin
  3111. tmpreg:=cg.getintregister(list,OS_32);
  3112. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  3113. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg));
  3114. end;
  3115. end;
  3116. OP_SUB:
  3117. begin
  3118. if is_shifter_const(aint(lo(value)),b) then
  3119. begin
  3120. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3121. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3122. end
  3123. else
  3124. begin
  3125. tmpreg:=cg.getintregister(list,OS_32);
  3126. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3127. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3128. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3129. end;
  3130. if is_shifter_const(aint(hi(value)),b) then
  3131. list.concat(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3132. else
  3133. begin
  3134. tmpreg:=cg.getintregister(list,OS_32);
  3135. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3136. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg));
  3137. end;
  3138. end;
  3139. else
  3140. internalerror(2003083101);
  3141. end;
  3142. end;
  3143. end;
  3144. procedure tcg64farm.a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3145. begin
  3146. ovloc.loc:=LOC_VOID;
  3147. case op of
  3148. OP_NEG,
  3149. OP_NOT :
  3150. internalerror(2012022502);
  3151. end;
  3152. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3153. begin
  3154. case op of
  3155. OP_ADD:
  3156. begin
  3157. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3158. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3159. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi),PF_S));
  3160. end;
  3161. OP_SUB:
  3162. begin
  3163. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3164. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3165. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi),PF_S));
  3166. end;
  3167. else
  3168. internalerror(2003083101);
  3169. end;
  3170. if size=OS_64 then
  3171. begin
  3172. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3173. ovloc.loc:=LOC_FLAGS;
  3174. case op of
  3175. OP_ADD:
  3176. ovloc.resflags:=F_CS;
  3177. OP_SUB:
  3178. ovloc.resflags:=F_CC;
  3179. end;
  3180. end;
  3181. end
  3182. else
  3183. begin
  3184. case op of
  3185. OP_AND,OP_OR,OP_XOR:
  3186. begin
  3187. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);
  3188. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);
  3189. end;
  3190. OP_ADD:
  3191. begin
  3192. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3193. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3194. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi));
  3195. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3196. end;
  3197. OP_SUB:
  3198. begin
  3199. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3200. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3201. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi));
  3202. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3203. end;
  3204. else
  3205. internalerror(2003083101);
  3206. end;
  3207. end;
  3208. end;
  3209. procedure tthumbcgarm.init_register_allocators;
  3210. begin
  3211. inherited init_register_allocators;
  3212. if assigned(current_procinfo) and (current_procinfo.framepointer=NR_R7) then
  3213. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3214. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6],first_int_imreg,[])
  3215. else
  3216. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3217. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7],first_int_imreg,[]);
  3218. end;
  3219. procedure tthumbcgarm.done_register_allocators;
  3220. begin
  3221. rg[R_INTREGISTER].free;
  3222. rg[R_FPUREGISTER].free;
  3223. rg[R_MMREGISTER].free;
  3224. inherited done_register_allocators;
  3225. end;
  3226. procedure tthumbcgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  3227. var
  3228. ref : treference;
  3229. shift : byte;
  3230. r : byte;
  3231. regs, saveregs : tcpuregisterset;
  3232. r7offset,
  3233. stackmisalignment : pint;
  3234. postfix: toppostfix;
  3235. registerarea,
  3236. imm1, imm2: DWord;
  3237. stack_parameters: Boolean;
  3238. begin
  3239. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3240. LocalSize:=align(LocalSize,4);
  3241. { call instruction does not put anything on the stack }
  3242. stackmisalignment:=0;
  3243. if not(nostackframe) then
  3244. begin
  3245. a_reg_alloc(list,NR_STACK_POINTER_REG);
  3246. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3247. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  3248. { save int registers }
  3249. reference_reset(ref,4);
  3250. ref.index:=NR_STACK_POINTER_REG;
  3251. ref.addressmode:=AM_PREINDEXED;
  3252. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3253. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3254. begin
  3255. //!!!! a_reg_alloc(list,NR_R12);
  3256. //!!!! list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  3257. end;
  3258. { the (old) ARM APCS requires saving both the stack pointer (to
  3259. crawl the stack) and the PC (to identify the function this
  3260. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  3261. and R15 -- still needs updating for EABI and Darwin, they don't
  3262. need that }
  3263. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3264. regs:=regs+[RS_R7,RS_R14]
  3265. else
  3266. // if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  3267. include(regs,RS_R14);
  3268. { safely estimate stack size }
  3269. if localsize+current_settings.alignment.localalignmax+4>508 then
  3270. begin
  3271. include(rg[R_INTREGISTER].used_in_proc,RS_R4);
  3272. include(regs,RS_R4);
  3273. end;
  3274. registerarea:=0;
  3275. if regs<>[] then
  3276. begin
  3277. for r:=RS_R0 to RS_R15 do
  3278. if r in regs then
  3279. inc(registerarea,4);
  3280. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,regs));
  3281. end;
  3282. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3283. if stack_parameters or (LocalSize<>0) or
  3284. ((stackmisalignment<>0) and
  3285. ((pi_do_call in current_procinfo.flags) or
  3286. (po_assembler in current_procinfo.procdef.procoptions))) then
  3287. begin
  3288. { do we access stack parameters?
  3289. if yes, the previously estimated stacksize must be used }
  3290. if stack_parameters then
  3291. begin
  3292. if localsize>tarmprocinfo(current_procinfo).stackframesize then
  3293. begin
  3294. writeln(localsize);
  3295. writeln(tarmprocinfo(current_procinfo).stackframesize);
  3296. internalerror(2013040601);
  3297. end
  3298. else
  3299. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea;
  3300. end
  3301. else
  3302. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3303. if localsize<508 then
  3304. begin
  3305. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  3306. end
  3307. else if localsize<=1016 then
  3308. begin
  3309. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3310. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize-508));
  3311. end
  3312. else
  3313. begin
  3314. a_load_const_reg(list,OS_ADDR,-localsize,NR_R4);
  3315. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R4));
  3316. include(regs,RS_R4);
  3317. //!!!! if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  3318. //!!!! a_reg_alloc(list,NR_R12);
  3319. //!!!! a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  3320. //!!!! list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  3321. //!!!! a_reg_dealloc(list,NR_R12);
  3322. end;
  3323. end;
  3324. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3325. begin
  3326. list.concat(taicpu.op_reg_reg_const(A_ADD,current_procinfo.framepointer,NR_STACK_POINTER_REG,0));
  3327. end;
  3328. end;
  3329. end;
  3330. procedure tthumbcgarm.g_proc_exit(list: TAsmList; parasize: longint; nostackframe: boolean);
  3331. var
  3332. ref : treference;
  3333. LocalSize : longint;
  3334. r,
  3335. shift : byte;
  3336. saveregs,
  3337. regs : tcpuregisterset;
  3338. registerarea : DWord;
  3339. stackmisalignment: pint;
  3340. imm1, imm2: DWord;
  3341. stack_parameters : Boolean;
  3342. begin
  3343. if not(nostackframe) then
  3344. begin
  3345. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3346. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3347. include(regs,RS_R15);
  3348. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3349. include(regs,getsupreg(current_procinfo.framepointer));
  3350. registerarea:=0;
  3351. for r:=RS_R0 to RS_R15 do
  3352. if r in regs then
  3353. inc(registerarea,4);
  3354. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3355. LocalSize:=current_procinfo.calc_stackframe_size;
  3356. if stack_parameters then
  3357. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea
  3358. else
  3359. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3360. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  3361. (target_info.system in systems_darwin) then
  3362. begin
  3363. if (LocalSize<>0) or
  3364. ((stackmisalignment<>0) and
  3365. ((pi_do_call in current_procinfo.flags) or
  3366. (po_assembler in current_procinfo.procdef.procoptions))) then
  3367. begin
  3368. if LocalSize=0 then
  3369. else if LocalSize<=508 then
  3370. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  3371. else if LocalSize<=1016 then
  3372. begin
  3373. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3374. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,localsize-508));
  3375. end
  3376. else
  3377. begin
  3378. a_reg_alloc(list,NR_R3);
  3379. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R3);
  3380. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R3));
  3381. a_reg_dealloc(list,NR_R3);
  3382. end;
  3383. end;
  3384. if regs=[] then
  3385. begin
  3386. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3387. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3388. else
  3389. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3390. end
  3391. else
  3392. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,regs));
  3393. end;
  3394. end
  3395. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3396. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3397. else
  3398. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3399. end;
  3400. procedure tthumbcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3401. var
  3402. oppostfix:toppostfix;
  3403. usedtmpref: treference;
  3404. tmpreg,tmpreg2 : tregister;
  3405. dir : integer;
  3406. begin
  3407. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3408. FromSize := ToSize;
  3409. case FromSize of
  3410. { signed integer registers }
  3411. OS_8:
  3412. oppostfix:=PF_B;
  3413. OS_S8:
  3414. oppostfix:=PF_SB;
  3415. OS_16:
  3416. oppostfix:=PF_H;
  3417. OS_S16:
  3418. oppostfix:=PF_SH;
  3419. OS_32,
  3420. OS_S32:
  3421. oppostfix:=PF_None;
  3422. else
  3423. InternalError(200308298);
  3424. end;
  3425. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3426. begin
  3427. if target_info.endian=endian_big then
  3428. dir:=-1
  3429. else
  3430. dir:=1;
  3431. case FromSize of
  3432. OS_16,OS_S16:
  3433. begin
  3434. { only complicated references need an extra loadaddr }
  3435. if assigned(ref.symbol) or
  3436. (ref.index<>NR_NO) or
  3437. (ref.offset<-124) or
  3438. (ref.offset>124) or
  3439. { sometimes the compiler reused registers }
  3440. (reg=ref.index) or
  3441. (reg=ref.base) then
  3442. begin
  3443. tmpreg2:=getintregister(list,OS_INT);
  3444. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3445. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3446. end
  3447. else
  3448. usedtmpref:=ref;
  3449. if target_info.endian=endian_big then
  3450. inc(usedtmpref.offset,1);
  3451. tmpreg:=getintregister(list,OS_INT);
  3452. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3453. inc(usedtmpref.offset,dir);
  3454. if FromSize=OS_16 then
  3455. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3456. else
  3457. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3458. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3459. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3460. end;
  3461. OS_32,OS_S32:
  3462. begin
  3463. tmpreg:=getintregister(list,OS_INT);
  3464. { only complicated references need an extra loadaddr }
  3465. if assigned(ref.symbol) or
  3466. (ref.index<>NR_NO) or
  3467. (ref.offset<-124) or
  3468. (ref.offset>124) or
  3469. { sometimes the compiler reused registers }
  3470. (reg=ref.index) or
  3471. (reg=ref.base) then
  3472. begin
  3473. tmpreg2:=getintregister(list,OS_INT);
  3474. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3475. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3476. end
  3477. else
  3478. usedtmpref:=ref;
  3479. if ref.alignment=2 then
  3480. begin
  3481. if target_info.endian=endian_big then
  3482. inc(usedtmpref.offset,2);
  3483. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  3484. inc(usedtmpref.offset,dir*2);
  3485. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  3486. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3487. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3488. end
  3489. else
  3490. begin
  3491. if target_info.endian=endian_big then
  3492. inc(usedtmpref.offset,3);
  3493. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3494. inc(usedtmpref.offset,dir);
  3495. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3496. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3497. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3498. inc(usedtmpref.offset,dir);
  3499. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3500. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3501. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3502. inc(usedtmpref.offset,dir);
  3503. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3504. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,24));
  3505. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3506. end;
  3507. end
  3508. else
  3509. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3510. end;
  3511. end
  3512. else
  3513. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3514. if (fromsize=OS_S8) and (tosize = OS_16) then
  3515. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  3516. end;
  3517. procedure tthumbcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3518. var
  3519. imm_shift : byte;
  3520. l : tasmlabel;
  3521. hr : treference;
  3522. begin
  3523. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3524. internalerror(2002090902);
  3525. if is_thumb_imm(a) then
  3526. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3527. else
  3528. begin
  3529. reference_reset(hr,4);
  3530. current_asmdata.getjumplabel(l);
  3531. cg.a_label(current_procinfo.aktlocaldata,l);
  3532. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3533. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3534. hr.symbol:=l;
  3535. hr.base:=NR_PC;
  3536. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3537. end;
  3538. end;
  3539. procedure tthumbcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  3540. var
  3541. hsym : tsym;
  3542. href,
  3543. tmpref : treference;
  3544. paraloc : Pcgparalocation;
  3545. l : TAsmLabel;
  3546. begin
  3547. { calculate the parameter info for the procdef }
  3548. procdef.init_paraloc_info(callerside);
  3549. hsym:=tsym(procdef.parast.Find('self'));
  3550. if not(assigned(hsym) and
  3551. (hsym.typ=paravarsym)) then
  3552. internalerror(200305251);
  3553. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  3554. while paraloc<>nil do
  3555. with paraloc^ do
  3556. begin
  3557. case loc of
  3558. LOC_REGISTER:
  3559. begin
  3560. if is_thumb_imm(ioffset) then
  3561. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  3562. else
  3563. begin
  3564. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3565. reference_reset(tmpref,4);
  3566. current_asmdata.getjumplabel(l);
  3567. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3568. cg.a_label(current_procinfo.aktlocaldata,l);
  3569. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3570. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3571. tmpref.symbol:=l;
  3572. tmpref.base:=NR_PC;
  3573. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3574. a_op_reg_reg(list,OP_SUB,size,NR_R4,register);
  3575. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3576. end;
  3577. end;
  3578. LOC_REFERENCE:
  3579. begin
  3580. { offset in the wrapper needs to be adjusted for the stored
  3581. return address }
  3582. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),sizeof(pint));
  3583. if is_thumb_imm(ioffset) then
  3584. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  3585. else
  3586. begin
  3587. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3588. reference_reset(tmpref,4);
  3589. current_asmdata.getjumplabel(l);
  3590. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3591. cg.a_label(current_procinfo.aktlocaldata,l);
  3592. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3593. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3594. tmpref.symbol:=l;
  3595. tmpref.base:=NR_PC;
  3596. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3597. a_op_reg_ref(list,OP_SUB,size,NR_R4,href);
  3598. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3599. end;
  3600. end
  3601. else
  3602. internalerror(200309189);
  3603. end;
  3604. paraloc:=next;
  3605. end;
  3606. end;
  3607. function tthumbcgarm.handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference;
  3608. var
  3609. href : treference;
  3610. tmpreg : TRegister;
  3611. begin
  3612. href:=ref;
  3613. if { LDR/STR limitations }
  3614. (
  3615. (((op=A_LDR) and (oppostfix=PF_None)) or
  3616. ((op=A_STR) and (oppostfix=PF_None))) and
  3617. (ref.base<>NR_STACK_POINTER_REG) and
  3618. (abs(ref.offset)>124)
  3619. ) or
  3620. { LDRB/STRB limitations }
  3621. (
  3622. (((op=A_LDR) and (oppostfix=PF_B)) or
  3623. ((op=A_LDRB) and (oppostfix=PF_None)) or
  3624. ((op=A_STR) and (oppostfix=PF_B)) or
  3625. ((op=A_STRB) and (oppostfix=PF_None))) and
  3626. ((ref.base=NR_STACK_POINTER_REG) or
  3627. (ref.index=NR_STACK_POINTER_REG) or
  3628. (abs(ref.offset)>31)
  3629. )
  3630. ) or
  3631. { LDRH/STRH limitations }
  3632. (
  3633. (((op=A_LDR) and (oppostfix=PF_H)) or
  3634. ((op=A_LDRH) and (oppostfix=PF_None)) or
  3635. ((op=A_STR) and (oppostfix=PF_H)) or
  3636. ((op=A_STRH) and (oppostfix=PF_None))) and
  3637. ((ref.base=NR_STACK_POINTER_REG) or
  3638. (ref.index=NR_STACK_POINTER_REG) or
  3639. (abs(ref.offset)>62) or
  3640. ((abs(ref.offset) mod 2)<>0)
  3641. )
  3642. ) then
  3643. begin
  3644. tmpreg:=getintregister(list,OS_ADDR);
  3645. a_loadaddr_ref_reg(list,ref,tmpreg);
  3646. reference_reset_base(href,tmpreg,0,ref.alignment);
  3647. end
  3648. else if (op=A_LDR) and
  3649. (oppostfix in [PF_None]) and
  3650. (ref.base=NR_STACK_POINTER_REG) and
  3651. (abs(ref.offset)>1020) then
  3652. begin
  3653. tmpreg:=getintregister(list,OS_ADDR);
  3654. a_loadaddr_ref_reg(list,ref,tmpreg);
  3655. reference_reset_base(href,tmpreg,0,ref.alignment);
  3656. end
  3657. else if (op=A_LDR) and
  3658. ((oppostfix in [PF_SH,PF_SB]) or
  3659. (abs(ref.offset)>124)) then
  3660. begin
  3661. tmpreg:=getintregister(list,OS_ADDR);
  3662. a_loadaddr_ref_reg(list,ref,tmpreg);
  3663. reference_reset_base(href,tmpreg,0,ref.alignment);
  3664. end;
  3665. Result:=inherited handle_load_store(list, op, oppostfix, reg, href);
  3666. end;
  3667. procedure tthumbcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  3668. var
  3669. tmpreg,overflowreg : tregister;
  3670. asmop : tasmop;
  3671. begin
  3672. case op of
  3673. OP_NEG:
  3674. list.concat(taicpu.op_reg_reg(A_NEG,dst,src));
  3675. OP_NOT:
  3676. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  3677. OP_DIV,OP_IDIV:
  3678. internalerror(200308284);
  3679. OP_ROL:
  3680. begin
  3681. if not(size in [OS_32,OS_S32]) then
  3682. internalerror(2008072801);
  3683. { simulate ROL by ror'ing 32-value }
  3684. tmpreg:=getintregister(list,OS_32);
  3685. a_load_const_reg(list,OS_32,32,tmpreg);
  3686. list.concat(taicpu.op_reg_reg(A_SUB,tmpreg,src));
  3687. list.concat(taicpu.op_reg_reg(A_ROR,dst,src));
  3688. end;
  3689. else
  3690. begin
  3691. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3692. list.concat(setoppostfix(
  3693. taicpu.op_reg_reg(op_reg_opcg2asmop[op],dst,src),op_reg_postfix[op]));
  3694. end;
  3695. end;
  3696. maybeadjustresult(list,op,size,dst);
  3697. end;
  3698. procedure tthumbcgarm.a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);
  3699. var
  3700. tmpreg : tregister;
  3701. so : tshifterop;
  3702. l1 : longint;
  3703. imm1, imm2: DWord;
  3704. begin
  3705. //!!! ovloc.loc:=LOC_VOID;
  3706. if {$ifopt R+}(a<>-2147483648) and{$endif} {!!!!!! not setflags and } is_thumb_imm(-a) then
  3707. case op of
  3708. OP_ADD:
  3709. begin
  3710. op:=OP_SUB;
  3711. a:=aint(dword(-a));
  3712. end;
  3713. OP_SUB:
  3714. begin
  3715. op:=OP_ADD;
  3716. a:=aint(dword(-a));
  3717. end
  3718. end;
  3719. if is_thumb_imm(a) and (op in [OP_ADD,OP_SUB]) then
  3720. begin
  3721. // if cgsetflags or setflags then
  3722. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3723. list.concat(setoppostfix(
  3724. taicpu.op_reg_const(op_reg_opcg2asmop[op],dst,a),op_reg_postfix[op]));
  3725. if (cgsetflags {!!! or setflags }) and (size in [OS_8,OS_16,OS_32]) then
  3726. begin
  3727. //!!! ovloc.loc:=LOC_FLAGS;
  3728. case op of
  3729. OP_ADD:
  3730. //!!! ovloc.resflags:=F_CS;
  3731. ;
  3732. OP_SUB:
  3733. //!!! ovloc.resflags:=F_CC;
  3734. ;
  3735. end;
  3736. end;
  3737. end
  3738. else
  3739. begin
  3740. { there could be added some more sophisticated optimizations }
  3741. if (op in [OP_MUL,OP_IMUL,OP_DIV,OP_IDIV]) and (a=1) then
  3742. a_load_reg_reg(list,size,size,dst,dst)
  3743. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  3744. a_load_const_reg(list,size,0,dst)
  3745. else if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  3746. a_op_reg_reg(list,OP_NEG,size,dst,dst)
  3747. { we do this here instead in the peephole optimizer because
  3748. it saves us a register }
  3749. {$ifdef DUMMY}
  3750. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  3751. a_op_const_reg_reg(list,OP_SHL,size,l1,dst,dst)
  3752. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  3753. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  3754. begin
  3755. if l1>32 then{roozbeh does this ever happen?}
  3756. internalerror(200308296);
  3757. shifterop_reset(so);
  3758. so.shiftmode:=SM_LSL;
  3759. so.shiftimm:=l1;
  3760. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,dst,so));
  3761. end
  3762. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  3763. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  3764. begin
  3765. if l1>32 then{does this ever happen?}
  3766. internalerror(201205181);
  3767. shifterop_reset(so);
  3768. so.shiftmode:=SM_LSL;
  3769. so.shiftimm:=l1;
  3770. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,dst,dst,so));
  3771. end
  3772. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,dst,dst) then
  3773. begin
  3774. { nothing to do on success }
  3775. end
  3776. {$endif DUMMY}
  3777. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  3778. Just using mov x, #0 might allow some easier optimizations down the line. }
  3779. else if (op = OP_AND) and (dword(a)=0) then
  3780. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  3781. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  3782. else if (op = OP_AND) and (not(dword(a))=0) then
  3783. // do nothing
  3784. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  3785. broader range of shifterconstants.}
  3786. {$ifdef DUMMY}
  3787. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  3788. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,not(dword(a))))
  3789. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  3790. begin
  3791. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm1));
  3792. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  3793. end
  3794. else if (op in [OP_ADD, OP_SUB, OP_OR]) and
  3795. not(cgsetflags or setflags) and
  3796. split_into_shifter_const(a, imm1, imm2) then
  3797. begin
  3798. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm1));
  3799. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  3800. end
  3801. {$endif DUMMY}
  3802. else if (op in [OP_SHL, OP_SHR, OP_SAR]) then
  3803. begin
  3804. list.concat(taicpu.op_reg_reg_const(op_reg_opcg2asmop[op],dst,dst,a));
  3805. end
  3806. else
  3807. begin
  3808. tmpreg:=getintregister(list,size);
  3809. a_load_const_reg(list,size,a,tmpreg);
  3810. a_op_reg_reg(list,op,size,tmpreg,dst);
  3811. end;
  3812. end;
  3813. maybeadjustresult(list,op,size,dst);
  3814. end;
  3815. procedure tthumbcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister);
  3816. begin
  3817. if (op=OP_ADD) and (src=NR_R13) and (dst<>NR_R13) and ((a mod 4)=0) and (a>0) and (a<=1020) then
  3818. list.concat(taicpu.op_reg_reg_const(A_ADD,dst,src,a))
  3819. else
  3820. inherited a_op_const_reg_reg(list,op,size,a,src,dst);
  3821. end;
  3822. procedure tthumbcgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  3823. var
  3824. l1,l2 : tasmlabel;
  3825. ai : taicpu;
  3826. begin
  3827. current_asmdata.getjumplabel(l1);
  3828. current_asmdata.getjumplabel(l2);
  3829. ai:=setcondition(taicpu.op_sym(A_B,l1),flags_to_cond(f));
  3830. ai.is_jmp:=true;
  3831. list.concat(ai);
  3832. list.concat(taicpu.op_reg_const(A_MOV,reg,0));
  3833. list.concat(taicpu.op_sym(A_B,l2));
  3834. cg.a_label(list,l1);
  3835. list.concat(taicpu.op_reg_const(A_MOV,reg,1));
  3836. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3837. cg.a_label(list,l2);
  3838. end;
  3839. procedure tthumb2cgarm.init_register_allocators;
  3840. begin
  3841. inherited init_register_allocators;
  3842. { currently, we save R14 always, so we can use it }
  3843. if (target_info.system<>system_arm_darwin) then
  3844. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3845. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3846. RS_R9,RS_R10,RS_R12,RS_R14],first_int_imreg,[])
  3847. else
  3848. { r9 is not available on Darwin according to the llvm code generator }
  3849. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3850. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3851. RS_R10,RS_R12,RS_R14],first_int_imreg,[]);
  3852. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  3853. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  3854. if current_settings.fputype=fpu_vfpv3 then
  3855. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3856. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3857. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  3858. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3859. ],first_mm_imreg,[])
  3860. else if current_settings.fputype in [fpu_fpv4_s16,fpu_vfpv3_d16] then
  3861. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3862. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3863. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3864. ],first_mm_imreg,[])
  3865. else
  3866. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBNONE,
  3867. [RS_S0,RS_S1,RS_R2,RS_R3,RS_R4,RS_S31],first_mm_imreg,[]);
  3868. end;
  3869. procedure tthumb2cgarm.done_register_allocators;
  3870. begin
  3871. rg[R_INTREGISTER].free;
  3872. rg[R_FPUREGISTER].free;
  3873. rg[R_MMREGISTER].free;
  3874. inherited done_register_allocators;
  3875. end;
  3876. procedure tthumb2cgarm.a_call_reg(list : TAsmList;reg: tregister);
  3877. begin
  3878. list.concat(taicpu.op_reg(A_BLX, reg));
  3879. {
  3880. the compiler does not properly set this flag anymore in pass 1, and
  3881. for now we only need it after pass 2 (I hope) (JM)
  3882. if not(pi_do_call in current_procinfo.flags) then
  3883. internalerror(2003060703);
  3884. }
  3885. include(current_procinfo.flags,pi_do_call);
  3886. end;
  3887. procedure tthumb2cgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3888. var
  3889. imm_shift : byte;
  3890. l : tasmlabel;
  3891. hr : treference;
  3892. begin
  3893. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3894. internalerror(2002090902);
  3895. if is_thumb32_imm(a) then
  3896. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3897. else if is_thumb32_imm(not(a)) then
  3898. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  3899. else if (a and $FFFF)=a then
  3900. list.concat(taicpu.op_reg_const(A_MOVW,reg,a))
  3901. else
  3902. begin
  3903. reference_reset(hr,4);
  3904. current_asmdata.getjumplabel(l);
  3905. cg.a_label(current_procinfo.aktlocaldata,l);
  3906. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3907. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3908. hr.symbol:=l;
  3909. hr.base:=NR_PC;
  3910. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3911. end;
  3912. end;
  3913. procedure tthumb2cgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3914. var
  3915. oppostfix:toppostfix;
  3916. usedtmpref: treference;
  3917. tmpreg,tmpreg2 : tregister;
  3918. so : tshifterop;
  3919. dir : integer;
  3920. begin
  3921. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3922. FromSize := ToSize;
  3923. case FromSize of
  3924. { signed integer registers }
  3925. OS_8:
  3926. oppostfix:=PF_B;
  3927. OS_S8:
  3928. oppostfix:=PF_SB;
  3929. OS_16:
  3930. oppostfix:=PF_H;
  3931. OS_S16:
  3932. oppostfix:=PF_SH;
  3933. OS_32,
  3934. OS_S32:
  3935. oppostfix:=PF_None;
  3936. else
  3937. InternalError(200308299);
  3938. end;
  3939. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3940. begin
  3941. if target_info.endian=endian_big then
  3942. dir:=-1
  3943. else
  3944. dir:=1;
  3945. case FromSize of
  3946. OS_16,OS_S16:
  3947. begin
  3948. { only complicated references need an extra loadaddr }
  3949. if assigned(ref.symbol) or
  3950. (ref.index<>NR_NO) or
  3951. (ref.offset<-255) or
  3952. (ref.offset>4094) or
  3953. { sometimes the compiler reused registers }
  3954. (reg=ref.index) or
  3955. (reg=ref.base) then
  3956. begin
  3957. tmpreg2:=getintregister(list,OS_INT);
  3958. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3959. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3960. end
  3961. else
  3962. usedtmpref:=ref;
  3963. if target_info.endian=endian_big then
  3964. inc(usedtmpref.offset,1);
  3965. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  3966. tmpreg:=getintregister(list,OS_INT);
  3967. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3968. inc(usedtmpref.offset,dir);
  3969. if FromSize=OS_16 then
  3970. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3971. else
  3972. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3973. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  3974. end;
  3975. OS_32,OS_S32:
  3976. begin
  3977. tmpreg:=getintregister(list,OS_INT);
  3978. { only complicated references need an extra loadaddr }
  3979. if assigned(ref.symbol) or
  3980. (ref.index<>NR_NO) or
  3981. (ref.offset<-255) or
  3982. (ref.offset>4092) or
  3983. { sometimes the compiler reused registers }
  3984. (reg=ref.index) or
  3985. (reg=ref.base) then
  3986. begin
  3987. tmpreg2:=getintregister(list,OS_INT);
  3988. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3989. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3990. end
  3991. else
  3992. usedtmpref:=ref;
  3993. shifterop_reset(so);so.shiftmode:=SM_LSL;
  3994. if ref.alignment=2 then
  3995. begin
  3996. if target_info.endian=endian_big then
  3997. inc(usedtmpref.offset,2);
  3998. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  3999. inc(usedtmpref.offset,dir*2);
  4000. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  4001. so.shiftimm:=16;
  4002. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4003. end
  4004. else
  4005. begin
  4006. if target_info.endian=endian_big then
  4007. inc(usedtmpref.offset,3);
  4008. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  4009. inc(usedtmpref.offset,dir);
  4010. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4011. so.shiftimm:=8;
  4012. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4013. inc(usedtmpref.offset,dir);
  4014. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4015. so.shiftimm:=16;
  4016. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4017. inc(usedtmpref.offset,dir);
  4018. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4019. so.shiftimm:=24;
  4020. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4021. end;
  4022. end
  4023. else
  4024. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4025. end;
  4026. end
  4027. else
  4028. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4029. if (fromsize=OS_S8) and (tosize = OS_16) then
  4030. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  4031. end;
  4032. procedure tthumb2cgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  4033. begin
  4034. if op = OP_NOT then
  4035. begin
  4036. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  4037. case size of
  4038. OS_8: list.concat(taicpu.op_reg_reg(A_UXTB,dst,dst));
  4039. OS_S8: list.concat(taicpu.op_reg_reg(A_SXTB,dst,dst));
  4040. OS_16: list.concat(taicpu.op_reg_reg(A_UXTH,dst,dst));
  4041. OS_S16: list.concat(taicpu.op_reg_reg(A_SXTH,dst,dst));
  4042. end;
  4043. end
  4044. else
  4045. inherited a_op_reg_reg(list, op, size, src, dst);
  4046. end;
  4047. procedure tthumb2cgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4048. var
  4049. shift, width : byte;
  4050. tmpreg : tregister;
  4051. so : tshifterop;
  4052. l1 : longint;
  4053. begin
  4054. ovloc.loc:=LOC_VOID;
  4055. if {$ifopt R+}(a<>-2147483648) and{$endif} is_shifter_const(-a,shift) then
  4056. case op of
  4057. OP_ADD:
  4058. begin
  4059. op:=OP_SUB;
  4060. a:=aint(dword(-a));
  4061. end;
  4062. OP_SUB:
  4063. begin
  4064. op:=OP_ADD;
  4065. a:=aint(dword(-a));
  4066. end
  4067. end;
  4068. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  4069. case op of
  4070. OP_NEG,OP_NOT,
  4071. OP_DIV,OP_IDIV:
  4072. internalerror(200308285);
  4073. OP_SHL:
  4074. begin
  4075. if a>32 then
  4076. internalerror(2014020703);
  4077. if a<>0 then
  4078. begin
  4079. shifterop_reset(so);
  4080. so.shiftmode:=SM_LSL;
  4081. so.shiftimm:=a;
  4082. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4083. end
  4084. else
  4085. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4086. end;
  4087. OP_ROL:
  4088. begin
  4089. if a>32 then
  4090. internalerror(2014020704);
  4091. if a<>0 then
  4092. begin
  4093. shifterop_reset(so);
  4094. so.shiftmode:=SM_ROR;
  4095. so.shiftimm:=32-a;
  4096. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4097. end
  4098. else
  4099. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4100. end;
  4101. OP_ROR:
  4102. begin
  4103. if a>32 then
  4104. internalerror(2014020705);
  4105. if a<>0 then
  4106. begin
  4107. shifterop_reset(so);
  4108. so.shiftmode:=SM_ROR;
  4109. so.shiftimm:=a;
  4110. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4111. end
  4112. else
  4113. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4114. end;
  4115. OP_SHR:
  4116. begin
  4117. if a>32 then
  4118. internalerror(200308292);
  4119. shifterop_reset(so);
  4120. if a<>0 then
  4121. begin
  4122. so.shiftmode:=SM_LSR;
  4123. so.shiftimm:=a;
  4124. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4125. end
  4126. else
  4127. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4128. end;
  4129. OP_SAR:
  4130. begin
  4131. if a>32 then
  4132. internalerror(200308295);
  4133. if a<>0 then
  4134. begin
  4135. shifterop_reset(so);
  4136. so.shiftmode:=SM_ASR;
  4137. so.shiftimm:=a;
  4138. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4139. end
  4140. else
  4141. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4142. end;
  4143. else
  4144. if (op in [OP_SUB, OP_ADD]) and
  4145. ((a < 0) or
  4146. (a > 4095)) then
  4147. begin
  4148. tmpreg:=getintregister(list,size);
  4149. a_load_const_reg(list, size, a, tmpreg);
  4150. if cgsetflags or setflags then
  4151. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4152. list.concat(setoppostfix(
  4153. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4154. end
  4155. else
  4156. begin
  4157. if cgsetflags or setflags then
  4158. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4159. list.concat(setoppostfix(
  4160. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4161. end;
  4162. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  4163. begin
  4164. ovloc.loc:=LOC_FLAGS;
  4165. case op of
  4166. OP_ADD:
  4167. ovloc.resflags:=F_CS;
  4168. OP_SUB:
  4169. ovloc.resflags:=F_CC;
  4170. end;
  4171. end;
  4172. end
  4173. else
  4174. begin
  4175. { there could be added some more sophisticated optimizations }
  4176. if (op in [OP_MUL,OP_IMUL]) and (a=1) then
  4177. a_load_reg_reg(list,size,size,src,dst)
  4178. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  4179. a_load_const_reg(list,size,0,dst)
  4180. else if (op in [OP_IMUL]) and (a=-1) then
  4181. a_op_reg_reg(list,OP_NEG,size,src,dst)
  4182. { we do this here instead in the peephole optimizer because
  4183. it saves us a register }
  4184. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  4185. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  4186. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  4187. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  4188. begin
  4189. if l1>32 then{roozbeh does this ever happen?}
  4190. internalerror(200308296);
  4191. shifterop_reset(so);
  4192. so.shiftmode:=SM_LSL;
  4193. so.shiftimm:=l1;
  4194. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  4195. end
  4196. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  4197. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  4198. begin
  4199. if l1>32 then{does this ever happen?}
  4200. internalerror(201205181);
  4201. shifterop_reset(so);
  4202. so.shiftmode:=SM_LSL;
  4203. so.shiftimm:=l1;
  4204. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  4205. end
  4206. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  4207. begin
  4208. { nothing to do on success }
  4209. end
  4210. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  4211. Just using mov x, #0 might allow some easier optimizations down the line. }
  4212. else if (op = OP_AND) and (dword(a)=0) then
  4213. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  4214. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  4215. else if (op = OP_AND) and (not(dword(a))=0) then
  4216. list.concat(taicpu.op_reg_reg(A_MOV,dst,src))
  4217. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  4218. broader range of shifterconstants.}
  4219. {else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  4220. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))}
  4221. else if (op = OP_AND) and is_thumb32_imm(a) then
  4222. list.concat(taicpu.op_reg_reg_const(A_AND,dst,src,dword(a)))
  4223. else if (op = OP_AND) and (a = $FFFF) then
  4224. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  4225. else if (op = OP_AND) and is_thumb32_imm(not(dword(a))) then
  4226. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  4227. else if (op = OP_AND) and is_continuous_mask(not(a), shift, width) then
  4228. begin
  4229. a_load_reg_reg(list,size,size,src,dst);
  4230. list.concat(taicpu.op_reg_const_const(A_BFC,dst,shift,width))
  4231. end
  4232. else
  4233. begin
  4234. tmpreg:=getintregister(list,size);
  4235. a_load_const_reg(list,size,a,tmpreg);
  4236. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  4237. end;
  4238. end;
  4239. maybeadjustresult(list,op,size,dst);
  4240. end;
  4241. const
  4242. op_reg_reg_opcg2asmopThumb2: array[TOpCG] of tasmop =
  4243. (A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NONE,A_MVN,A_ORR,
  4244. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  4245. procedure tthumb2cgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4246. var
  4247. so : tshifterop;
  4248. tmpreg,overflowreg : tregister;
  4249. asmop : tasmop;
  4250. begin
  4251. ovloc.loc:=LOC_VOID;
  4252. case op of
  4253. OP_NEG,OP_NOT:
  4254. internalerror(200308286);
  4255. OP_ROL:
  4256. begin
  4257. if not(size in [OS_32,OS_S32]) then
  4258. internalerror(2008072801);
  4259. { simulate ROL by ror'ing 32-value }
  4260. tmpreg:=getintregister(list,OS_32);
  4261. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,32));
  4262. list.concat(taicpu.op_reg_reg_reg(A_SUB,src1,tmpreg,src1));
  4263. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4264. end;
  4265. OP_ROR:
  4266. begin
  4267. if not(size in [OS_32,OS_S32]) then
  4268. internalerror(2008072802);
  4269. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4270. end;
  4271. OP_IMUL,
  4272. OP_MUL:
  4273. begin
  4274. if cgsetflags or setflags then
  4275. begin
  4276. overflowreg:=getintregister(list,size);
  4277. if op=OP_IMUL then
  4278. asmop:=A_SMULL
  4279. else
  4280. asmop:=A_UMULL;
  4281. { the arm doesn't allow that rd and rm are the same }
  4282. if dst=src2 then
  4283. begin
  4284. if dst<>src1 then
  4285. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  4286. else
  4287. begin
  4288. tmpreg:=getintregister(list,size);
  4289. a_load_reg_reg(list,size,size,src2,dst);
  4290. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  4291. end;
  4292. end
  4293. else
  4294. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  4295. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4296. if op=OP_IMUL then
  4297. begin
  4298. shifterop_reset(so);
  4299. so.shiftmode:=SM_ASR;
  4300. so.shiftimm:=31;
  4301. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  4302. end
  4303. else
  4304. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  4305. ovloc.loc:=LOC_FLAGS;
  4306. ovloc.resflags:=F_NE;
  4307. end
  4308. else
  4309. begin
  4310. { the arm doesn't allow that rd and rm are the same }
  4311. if dst=src2 then
  4312. begin
  4313. if dst<>src1 then
  4314. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  4315. else
  4316. begin
  4317. tmpreg:=getintregister(list,size);
  4318. a_load_reg_reg(list,size,size,src2,dst);
  4319. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  4320. end;
  4321. end
  4322. else
  4323. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  4324. end;
  4325. end;
  4326. else
  4327. begin
  4328. if cgsetflags or setflags then
  4329. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4330. {$ifdef dummy}
  4331. { R13 is not allowed for certain instruction operands }
  4332. if op_reg_reg_opcg2asmopThumb2[op] in [A_ADD,A_SUB,A_AND,A_BIC,A_EOR] then
  4333. begin
  4334. if getsupreg(dst)=RS_R13 then
  4335. begin
  4336. tmpreg:=getintregister(list,OS_INT);
  4337. a_load_reg_reg(list,OS_INT,OS_INT,dst,tmpreg);
  4338. dst:=tmpreg;
  4339. end;
  4340. if getsupreg(src1)=RS_R13 then
  4341. begin
  4342. tmpreg:=getintregister(list,OS_INT);
  4343. a_load_reg_reg(list,OS_INT,OS_INT,src1,tmpreg);
  4344. src1:=tmpreg;
  4345. end;
  4346. end;
  4347. {$endif}
  4348. list.concat(setoppostfix(
  4349. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmopThumb2[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4350. end;
  4351. end;
  4352. maybeadjustresult(list,op,size,dst);
  4353. end;
  4354. procedure tthumb2cgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  4355. var item: taicpu;
  4356. begin
  4357. list.concat(taicpu.op_cond(A_ITE, flags_to_cond(f)));
  4358. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  4359. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  4360. end;
  4361. procedure tthumb2cgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  4362. var
  4363. ref : treference;
  4364. shift : byte;
  4365. firstfloatreg,lastfloatreg,
  4366. r : byte;
  4367. regs : tcpuregisterset;
  4368. stackmisalignment: pint;
  4369. begin
  4370. LocalSize:=align(LocalSize,4);
  4371. { call instruction does not put anything on the stack }
  4372. stackmisalignment:=0;
  4373. if not(nostackframe) then
  4374. begin
  4375. firstfloatreg:=RS_NO;
  4376. lastfloatreg:=RS_NO;
  4377. { save floating point registers? }
  4378. for r:=RS_F0 to RS_F7 do
  4379. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4380. begin
  4381. if firstfloatreg=RS_NO then
  4382. firstfloatreg:=r;
  4383. lastfloatreg:=r;
  4384. inc(stackmisalignment,12);
  4385. end;
  4386. a_reg_alloc(list,NR_STACK_POINTER_REG);
  4387. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4388. begin
  4389. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  4390. a_reg_alloc(list,NR_R12);
  4391. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  4392. end;
  4393. { save int registers }
  4394. reference_reset(ref,4);
  4395. ref.index:=NR_STACK_POINTER_REG;
  4396. ref.addressmode:=AM_PREINDEXED;
  4397. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4398. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4399. regs:=regs+[RS_FRAME_POINTER_REG,RS_R14]
  4400. else if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  4401. include(regs,RS_R14);
  4402. if regs<>[] then
  4403. begin
  4404. for r:=RS_R0 to RS_R15 do
  4405. if (r in regs) then
  4406. inc(stackmisalignment,4);
  4407. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4408. end;
  4409. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4410. begin
  4411. { the framepointer now points to the saved R15, so the saved
  4412. framepointer is at R11-12 (for get_caller_frame) }
  4413. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  4414. a_reg_dealloc(list,NR_R12);
  4415. end;
  4416. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4417. if (LocalSize<>0) or
  4418. ((stackmisalignment<>0) and
  4419. ((pi_do_call in current_procinfo.flags) or
  4420. (po_assembler in current_procinfo.procdef.procoptions))) then
  4421. begin
  4422. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4423. if not(is_shifter_const(localsize,shift)) then
  4424. begin
  4425. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  4426. a_reg_alloc(list,NR_R12);
  4427. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4428. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  4429. a_reg_dealloc(list,NR_R12);
  4430. end
  4431. else
  4432. begin
  4433. a_reg_dealloc(list,NR_R12);
  4434. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  4435. end;
  4436. end;
  4437. if firstfloatreg<>RS_NO then
  4438. begin
  4439. reference_reset(ref,4);
  4440. if tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023 then
  4441. begin
  4442. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  4443. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4444. ref.base:=NR_R12;
  4445. end
  4446. else
  4447. begin
  4448. ref.base:=current_procinfo.framepointer;
  4449. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  4450. end;
  4451. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4452. lastfloatreg-firstfloatreg+1,ref));
  4453. end;
  4454. end;
  4455. end;
  4456. procedure tthumb2cgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  4457. var
  4458. ref : treference;
  4459. firstfloatreg,lastfloatreg,
  4460. r : byte;
  4461. shift : byte;
  4462. regs : tcpuregisterset;
  4463. LocalSize : longint;
  4464. stackmisalignment: pint;
  4465. begin
  4466. if not(nostackframe) then
  4467. begin
  4468. stackmisalignment:=0;
  4469. { restore floating point register }
  4470. firstfloatreg:=RS_NO;
  4471. lastfloatreg:=RS_NO;
  4472. { save floating point registers? }
  4473. for r:=RS_F0 to RS_F7 do
  4474. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4475. begin
  4476. if firstfloatreg=RS_NO then
  4477. firstfloatreg:=r;
  4478. lastfloatreg:=r;
  4479. { floating point register space is already included in
  4480. localsize below by calc_stackframe_size
  4481. inc(stackmisalignment,12);
  4482. }
  4483. end;
  4484. if firstfloatreg<>RS_NO then
  4485. begin
  4486. reference_reset(ref,4);
  4487. if tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023 then
  4488. begin
  4489. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  4490. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4491. ref.base:=NR_R12;
  4492. end
  4493. else
  4494. begin
  4495. ref.base:=current_procinfo.framepointer;
  4496. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  4497. end;
  4498. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4499. lastfloatreg-firstfloatreg+1,ref));
  4500. end;
  4501. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4502. if (pi_do_call in current_procinfo.flags) or (regs<>[]) then
  4503. begin
  4504. exclude(regs,RS_R14);
  4505. include(regs,RS_R15);
  4506. end;
  4507. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  4508. regs:=regs+[RS_FRAME_POINTER_REG,RS_R15];
  4509. for r:=RS_R0 to RS_R15 do
  4510. if (r in regs) then
  4511. inc(stackmisalignment,4);
  4512. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4513. LocalSize:=current_procinfo.calc_stackframe_size;
  4514. if (LocalSize<>0) or
  4515. ((stackmisalignment<>0) and
  4516. ((pi_do_call in current_procinfo.flags) or
  4517. (po_assembler in current_procinfo.procdef.procoptions))) then
  4518. begin
  4519. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4520. if not(is_shifter_const(LocalSize,shift)) then
  4521. begin
  4522. a_reg_alloc(list,NR_R12);
  4523. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4524. list.concat(taicpu.op_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_R12));
  4525. a_reg_dealloc(list,NR_R12);
  4526. end
  4527. else
  4528. begin
  4529. a_reg_dealloc(list,NR_R12);
  4530. list.concat(taicpu.op_reg_const(A_ADD,NR_STACK_POINTER_REG,LocalSize));
  4531. end;
  4532. end;
  4533. if regs=[] then
  4534. list.concat(taicpu.op_reg_reg(A_MOV,NR_R15,NR_R14))
  4535. else
  4536. begin
  4537. reference_reset(ref,4);
  4538. ref.index:=NR_STACK_POINTER_REG;
  4539. ref.addressmode:=AM_PREINDEXED;
  4540. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4541. end;
  4542. end
  4543. else
  4544. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14));
  4545. end;
  4546. function tthumb2cgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  4547. var
  4548. tmpreg : tregister;
  4549. tmpref : treference;
  4550. l : tasmlabel;
  4551. so: tshifterop;
  4552. begin
  4553. tmpreg:=NR_NO;
  4554. { Be sure to have a base register }
  4555. if (ref.base=NR_NO) then
  4556. begin
  4557. if ref.shiftmode<>SM_None then
  4558. internalerror(2014020706);
  4559. ref.base:=ref.index;
  4560. ref.index:=NR_NO;
  4561. end;
  4562. { absolute symbols can't be handled directly, we've to store the symbol reference
  4563. in the text segment and access it pc relative
  4564. For now, we assume that references where base or index equals to PC are already
  4565. relative, all other references are assumed to be absolute and thus they need
  4566. to be handled extra.
  4567. A proper solution would be to change refoptions to a set and store the information
  4568. if the symbol is absolute or relative there.
  4569. }
  4570. if (assigned(ref.symbol) and
  4571. not(is_pc(ref.base)) and
  4572. not(is_pc(ref.index))
  4573. ) or
  4574. { [#xxx] isn't a valid address operand }
  4575. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  4576. //(ref.offset<-4095) or
  4577. (ref.offset<-255) or
  4578. (ref.offset>4095) or
  4579. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  4580. ((ref.offset<-255) or
  4581. (ref.offset>255)
  4582. )
  4583. ) or
  4584. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  4585. ((ref.offset<-1020) or
  4586. (ref.offset>1020) or
  4587. ((abs(ref.offset) mod 4)<>0) or
  4588. { the usual pc relative symbol handling assumes possible offsets of +/- 4095 }
  4589. assigned(ref.symbol)
  4590. )
  4591. ) then
  4592. begin
  4593. reference_reset(tmpref,4);
  4594. { load symbol }
  4595. tmpreg:=getintregister(list,OS_INT);
  4596. if assigned(ref.symbol) then
  4597. begin
  4598. current_asmdata.getjumplabel(l);
  4599. cg.a_label(current_procinfo.aktlocaldata,l);
  4600. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  4601. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset));
  4602. { load consts entry }
  4603. tmpref.symbol:=l;
  4604. tmpref.base:=NR_R15;
  4605. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  4606. { in case of LDF/STF, we got rid of the NR_R15 }
  4607. if is_pc(ref.base) then
  4608. ref.base:=NR_NO;
  4609. if is_pc(ref.index) then
  4610. ref.index:=NR_NO;
  4611. end
  4612. else
  4613. a_load_const_reg(list,OS_ADDR,ref.offset,tmpreg);
  4614. if (ref.base<>NR_NO) then
  4615. begin
  4616. if ref.index<>NR_NO then
  4617. begin
  4618. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4619. ref.base:=tmpreg;
  4620. end
  4621. else
  4622. begin
  4623. ref.index:=tmpreg;
  4624. ref.shiftimm:=0;
  4625. ref.signindex:=1;
  4626. ref.shiftmode:=SM_None;
  4627. end;
  4628. end
  4629. else
  4630. ref.base:=tmpreg;
  4631. ref.offset:=0;
  4632. ref.symbol:=nil;
  4633. end;
  4634. if (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  4635. begin
  4636. if tmpreg<>NR_NO then
  4637. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg,tmpreg)
  4638. else
  4639. begin
  4640. tmpreg:=getintregister(list,OS_ADDR);
  4641. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg);
  4642. ref.base:=tmpreg;
  4643. end;
  4644. ref.offset:=0;
  4645. end;
  4646. { Hack? Thumb2 doesn't allow PC indexed addressing modes(although it does in the specification) }
  4647. if (ref.base=NR_R15) and (ref.index<>NR_NO) and (ref.shiftmode <> sm_none) then
  4648. begin
  4649. tmpreg:=getintregister(list,OS_ADDR);
  4650. list.concat(taicpu.op_reg_reg(A_MOV, tmpreg, NR_R15));
  4651. ref.base := tmpreg;
  4652. end;
  4653. { floating point operations have only limited references
  4654. we expect here, that a base is already set }
  4655. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  4656. begin
  4657. if ref.shiftmode<>SM_none then
  4658. internalerror(200309121);
  4659. if tmpreg<>NR_NO then
  4660. begin
  4661. if ref.base=tmpreg then
  4662. begin
  4663. if ref.signindex<0 then
  4664. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,tmpreg,ref.index))
  4665. else
  4666. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,tmpreg,ref.index));
  4667. ref.index:=NR_NO;
  4668. end
  4669. else
  4670. begin
  4671. if ref.index<>tmpreg then
  4672. internalerror(200403161);
  4673. if ref.signindex<0 then
  4674. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,ref.base,tmpreg))
  4675. else
  4676. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4677. ref.base:=tmpreg;
  4678. ref.index:=NR_NO;
  4679. end;
  4680. end
  4681. else
  4682. begin
  4683. tmpreg:=getintregister(list,OS_ADDR);
  4684. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,ref.index));
  4685. ref.base:=tmpreg;
  4686. ref.index:=NR_NO;
  4687. end;
  4688. end;
  4689. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  4690. Result := ref;
  4691. end;
  4692. procedure tthumb2cgarm.a_loadmm_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister; shuffle: pmmshuffle);
  4693. var
  4694. instr: taicpu;
  4695. begin
  4696. if (fromsize=OS_F32) and
  4697. (tosize=OS_F32) then
  4698. begin
  4699. instr:=setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32);
  4700. list.Concat(instr);
  4701. add_move_instruction(instr);
  4702. end
  4703. else if (fromsize=OS_F64) and
  4704. (tosize=OS_F64) then
  4705. begin
  4706. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,tregister(longint(reg2)+1),tregister(longint(reg1)+1)), PF_F32));
  4707. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32));
  4708. end
  4709. else if (fromsize=OS_F32) and
  4710. (tosize=OS_F64) then
  4711. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VCVT,reg2,reg1), PF_F32))
  4712. begin
  4713. //list.concat(nil);
  4714. end;
  4715. end;
  4716. procedure tthumb2cgarm.a_loadmm_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  4717. begin
  4718. handle_load_store(list,A_VLDR,PF_None,reg,ref);
  4719. end;
  4720. procedure tthumb2cgarm.a_loadmm_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  4721. begin
  4722. handle_load_store(list,A_VSTR,PF_None,reg,ref);
  4723. end;
  4724. procedure tthumb2cgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize: tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  4725. begin
  4726. if //(shuffle=nil) and
  4727. (tosize=OS_F32) then
  4728. list.Concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg))
  4729. else
  4730. internalerror(2012100813);
  4731. end;
  4732. procedure tthumb2cgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize: tcgsize; mmreg, intreg: tregister; shuffle: pmmshuffle);
  4733. begin
  4734. if //(shuffle=nil) and
  4735. (fromsize=OS_F32) then
  4736. list.Concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg))
  4737. else
  4738. internalerror(2012100814);
  4739. end;
  4740. procedure tthumb2cg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  4741. var tmpreg: tregister;
  4742. begin
  4743. case op of
  4744. OP_NEG:
  4745. begin
  4746. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4747. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  4748. tmpreg:=cg.getintregister(list,OS_32);
  4749. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,0));
  4750. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,tmpreg,regsrc.reghi));
  4751. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4752. end;
  4753. else
  4754. inherited a_op64_reg_reg(list, op, size, regsrc, regdst);
  4755. end;
  4756. end;
  4757. procedure tthumbcg64farm.a_op64_reg_reg(list: TAsmList; op: TOpCG; size: tcgsize; regsrc, regdst: tregister64);
  4758. begin
  4759. case op of
  4760. OP_NEG:
  4761. begin
  4762. list.concat(taicpu.op_reg_const(A_MOV,regdst.reglo,0));
  4763. list.concat(taicpu.op_reg_const(A_MOV,regdst.reghi,0));
  4764. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4765. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4766. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4767. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4768. end;
  4769. OP_NOT:
  4770. begin
  4771. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  4772. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  4773. end;
  4774. OP_AND,OP_OR,OP_XOR:
  4775. begin
  4776. cg.a_op_reg_reg(list,op,OS_32,regsrc.reglo,regdst.reglo);
  4777. cg.a_op_reg_reg(list,op,OS_32,regsrc.reghi,regdst.reghi);
  4778. end;
  4779. OP_ADD:
  4780. begin
  4781. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4782. list.concat(taicpu.op_reg_reg(A_ADD,regdst.reglo,regsrc.reglo));
  4783. list.concat(taicpu.op_reg_reg(A_ADC,regdst.reghi,regsrc.reghi));
  4784. end;
  4785. OP_SUB:
  4786. begin
  4787. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4788. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4789. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4790. end;
  4791. else
  4792. internalerror(2003083101);
  4793. end;
  4794. end;
  4795. procedure tthumbcg64farm.a_op64_const_reg(list: TAsmList; op: TOpCG; size: tcgsize; value: int64; reg: tregister64);
  4796. var
  4797. tmpreg : tregister;
  4798. b : byte;
  4799. begin
  4800. case op of
  4801. OP_AND,OP_OR,OP_XOR:
  4802. begin
  4803. cg.a_op_const_reg(list,op,OS_32,aint(lo(value)),reg.reglo);
  4804. cg.a_op_const_reg(list,op,OS_32,aint(hi(value)),reg.reghi);
  4805. end;
  4806. OP_ADD:
  4807. begin
  4808. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4809. begin
  4810. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4811. list.concat(taicpu.op_reg_const(A_ADD,reg.reglo,aint(lo(value))));
  4812. end
  4813. else
  4814. begin
  4815. tmpreg:=cg.getintregister(list,OS_32);
  4816. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4817. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4818. list.concat(taicpu.op_reg_reg(A_ADD,reg.reglo,tmpreg));
  4819. end;
  4820. tmpreg:=cg.getintregister(list,OS_32);
  4821. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  4822. list.concat(taicpu.op_reg_reg(A_ADC,reg.reghi,tmpreg));
  4823. end;
  4824. OP_SUB:
  4825. begin
  4826. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4827. begin
  4828. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4829. list.concat(taicpu.op_reg_const(A_SUB,reg.reglo,aint(lo(value))))
  4830. end
  4831. else
  4832. begin
  4833. tmpreg:=cg.getintregister(list,OS_32);
  4834. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4835. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4836. list.concat(taicpu.op_reg_reg(A_SUB,reg.reglo,tmpreg));
  4837. end;
  4838. tmpreg:=cg.getintregister(list,OS_32);
  4839. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  4840. list.concat(taicpu.op_reg_reg(A_SBC,reg.reghi,tmpreg));
  4841. end;
  4842. else
  4843. internalerror(2003083101);
  4844. end;
  4845. end;
  4846. procedure create_codegen;
  4847. begin
  4848. if GenerateThumb2Code then
  4849. begin
  4850. cg:=tthumb2cgarm.create;
  4851. cg64:=tthumb2cg64farm.create;
  4852. casmoptimizer:=TCpuThumb2AsmOptimizer;
  4853. end
  4854. else if GenerateThumbCode then
  4855. begin
  4856. cg:=tthumbcgarm.create;
  4857. cg64:=tthumbcg64farm.create;
  4858. // casmoptimizer:=TCpuThumbAsmOptimizer;
  4859. end
  4860. else
  4861. begin
  4862. cg:=tarmcgarm.create;
  4863. cg64:=tarmcg64farm.create;
  4864. casmoptimizer:=TCpuAsmOptimizer;
  4865. end;
  4866. end;
  4867. end.