cgcpu.pas 214 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762277227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382238323842385238623872388238923902391239223932394239523962397239823992400240124022403240424052406240724082409241024112412241324142415241624172418241924202421242224232424242524262427242824292430243124322433243424352436243724382439244024412442244324442445244624472448244924502451245224532454245524562457245824592460246124622463246424652466246724682469247024712472247324742475247624772478247924802481248224832484248524862487248824892490249124922493249424952496249724982499250025012502250325042505250625072508250925102511251225132514251525162517251825192520252125222523252425252526252725282529253025312532253325342535253625372538253925402541254225432544254525462547254825492550255125522553255425552556255725582559256025612562256325642565256625672568256925702571257225732574257525762577257825792580258125822583258425852586258725882589259025912592259325942595259625972598259926002601260226032604260526062607260826092610261126122613261426152616261726182619262026212622262326242625262626272628262926302631263226332634263526362637263826392640264126422643264426452646264726482649265026512652265326542655265626572658265926602661266226632664266526662667266826692670267126722673267426752676267726782679268026812682268326842685268626872688268926902691269226932694269526962697269826992700270127022703270427052706270727082709271027112712271327142715271627172718271927202721272227232724272527262727272827292730273127322733273427352736273727382739274027412742274327442745274627472748274927502751275227532754275527562757275827592760276127622763276427652766276727682769277027712772277327742775277627772778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327732783279328032813282328332843285328632873288328932903291329232933294329532963297329832993300330133023303330433053306330733083309331033113312331333143315331633173318331933203321332233233324332533263327332833293330333133323333333433353336333733383339334033413342334333443345334633473348334933503351335233533354335533563357335833593360336133623363336433653366336733683369337033713372337333743375337633773378337933803381338233833384338533863387338833893390339133923393339433953396339733983399340034013402340334043405340634073408340934103411341234133414341534163417341834193420342134223423342434253426342734283429343034313432343334343435343634373438343934403441344234433444344534463447344834493450345134523453345434553456345734583459346034613462346334643465346634673468346934703471347234733474347534763477347834793480348134823483348434853486348734883489349034913492349334943495349634973498349935003501350235033504350535063507350835093510351135123513351435153516351735183519352035213522352335243525352635273528352935303531353235333534353535363537353835393540354135423543354435453546354735483549355035513552355335543555355635573558355935603561356235633564356535663567356835693570357135723573357435753576357735783579358035813582358335843585358635873588358935903591359235933594359535963597359835993600360136023603360436053606360736083609361036113612361336143615361636173618361936203621362236233624362536263627362836293630363136323633363436353636363736383639364036413642364336443645364636473648364936503651365236533654365536563657365836593660366136623663366436653666366736683669367036713672367336743675367636773678367936803681368236833684368536863687368836893690369136923693369436953696369736983699370037013702370337043705370637073708370937103711371237133714371537163717371837193720372137223723372437253726372737283729373037313732373337343735373637373738373937403741374237433744374537463747374837493750375137523753375437553756375737583759376037613762376337643765376637673768376937703771377237733774377537763777377837793780378137823783378437853786378737883789379037913792379337943795379637973798379938003801380238033804380538063807380838093810381138123813381438153816381738183819382038213822382338243825382638273828382938303831383238333834383538363837383838393840384138423843384438453846384738483849385038513852385338543855385638573858385938603861386238633864386538663867386838693870387138723873387438753876387738783879388038813882388338843885388638873888388938903891389238933894389538963897389838993900390139023903390439053906390739083909391039113912391339143915391639173918391939203921392239233924392539263927392839293930393139323933393439353936393739383939394039413942394339443945394639473948394939503951395239533954395539563957395839593960396139623963396439653966396739683969397039713972397339743975397639773978397939803981398239833984398539863987398839893990399139923993399439953996399739983999400040014002400340044005400640074008400940104011401240134014401540164017401840194020402140224023402440254026402740284029403040314032403340344035403640374038403940404041404240434044404540464047404840494050405140524053405440554056405740584059406040614062406340644065406640674068406940704071407240734074407540764077407840794080408140824083408440854086408740884089409040914092409340944095409640974098409941004101410241034104410541064107410841094110411141124113411441154116411741184119412041214122412341244125412641274128412941304131413241334134413541364137413841394140414141424143414441454146414741484149415041514152415341544155415641574158415941604161416241634164416541664167416841694170417141724173417441754176417741784179418041814182418341844185418641874188418941904191419241934194419541964197419841994200420142024203420442054206420742084209421042114212421342144215421642174218421942204221422242234224422542264227422842294230423142324233423442354236423742384239424042414242424342444245424642474248424942504251425242534254425542564257425842594260426142624263426442654266426742684269427042714272427342744275427642774278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477747784779478047814782478347844785478647874788478947904791479247934794479547964797479847994800480148024803480448054806480748084809481048114812481348144815481648174818481948204821482248234824482548264827482848294830483148324833483448354836483748384839484048414842484348444845484648474848484948504851485248534854485548564857485848594860486148624863486448654866486748684869487048714872487348744875487648774878487948804881488248834884488548864887488848894890489148924893489448954896489748984899490049014902490349044905490649074908490949104911491249134914491549164917491849194920492149224923492449254926492749284929493049314932493349344935493649374938493949404941494249434944494549464947494849494950495149524953495449554956495749584959496049614962496349644965496649674968496949704971497249734974497549764977497849794980498149824983498449854986498749884989499049914992499349944995499649974998499950005001500250035004500550065007500850095010501150125013501450155016501750185019502050215022502350245025502650275028502950305031503250335034503550365037503850395040504150425043504450455046504750485049505050515052505350545055505650575058505950605061506250635064506550665067506850695070507150725073507450755076507750785079508050815082508350845085508650875088508950905091509250935094509550965097509850995100510151025103510451055106510751085109511051115112511351145115511651175118511951205121512251235124512551265127512851295130513151325133513451355136513751385139514051415142514351445145514651475148514951505151515251535154515551565157515851595160516151625163516451655166516751685169517051715172517351745175517651775178517951805181518251835184518551865187518851895190519151925193519451955196519751985199520052015202520352045205520652075208520952105211521252135214521552165217521852195220522152225223522452255226522752285229523052315232523352345235523652375238523952405241524252435244524552465247524852495250525152525253525452555256525752585259526052615262526352645265526652675268526952705271527252735274527552765277527852795280528152825283528452855286528752885289529052915292529352945295529652975298529953005301530253035304530553065307530853095310531153125313531453155316531753185319532053215322
  1. {
  2. Copyright (c) 2003 by Florian Klaempfl
  3. Member of the Free Pascal development team
  4. This unit implements the code generator for the ARM
  5. This program is free software; you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation; either version 2 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program; if not, write to the Free Software
  15. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  16. ****************************************************************************
  17. }
  18. unit cgcpu;
  19. {$i fpcdefs.inc}
  20. interface
  21. uses
  22. globtype,symtype,symdef,
  23. cgbase,cgutils,cgobj,
  24. aasmbase,aasmcpu,aasmtai,aasmdata,
  25. parabase,
  26. cpubase,cpuinfo,cg64f32,rgcpu;
  27. type
  28. { tbasecgarm is shared between all arm architectures }
  29. tbasecgarm = class(tcg)
  30. { true, if the next arithmetic operation should modify the flags }
  31. cgsetflags : boolean;
  32. procedure a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);override;
  33. procedure a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);override;
  34. procedure a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);override;
  35. procedure a_call_name(list : TAsmList;const s : string; weak: boolean);override;
  36. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  37. { move instructions }
  38. procedure a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);override;
  39. procedure a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);override;
  40. function a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  41. function a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  42. { fpu move instructions }
  43. procedure a_loadfpu_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister); override;
  44. procedure a_loadfpu_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister); override;
  45. procedure a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference); override;
  46. procedure a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);override;
  47. { comparison operations }
  48. procedure a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  49. l : tasmlabel);override;
  50. procedure a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel); override;
  51. procedure a_jmp_name(list : TAsmList;const s : string); override;
  52. procedure a_jmp_always(list : TAsmList;l: tasmlabel); override;
  53. procedure a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel); override;
  54. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  55. procedure g_profilecode(list : TAsmList); override;
  56. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  57. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  58. procedure g_maybe_got_init(list : TAsmList); override;
  59. procedure a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);override;
  60. procedure g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);override;
  61. procedure g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);override;
  62. procedure g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  63. procedure g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  64. procedure g_overflowcheck(list: TAsmList; const l: tlocation; def: tdef); override;
  65. procedure g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);override;
  66. procedure g_save_registers(list : TAsmList);override;
  67. procedure g_restore_registers(list : TAsmList);override;
  68. procedure a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  69. procedure fixref(list : TAsmList;var ref : treference);
  70. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; virtual;
  71. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  72. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  73. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  74. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  75. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  76. procedure a_opmm_reg_reg(list: TAsmList; Op: TOpCG; size : tcgsize;src,dst: tregister;shuffle : pmmshuffle); override;
  77. { Transform unsupported methods into Internal errors }
  78. procedure a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister); override;
  79. { try to generate optimized 32 Bit multiplication, returns true if successful generated }
  80. function try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  81. { clear out potential overflow bits from 8 or 16 bit operations }
  82. { the upper 24/16 bits of a register after an operation }
  83. procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  84. { mla for thumb requires that none of the registers is equal to r13/r15, this method ensures this }
  85. procedure safe_mla(list: TAsmList;op1,op2,op3,op4 : TRegister);
  86. end;
  87. { tcgarm is shared between normal arm and thumb-2 }
  88. tcgarm = class(tbasecgarm)
  89. procedure a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister); override;
  90. procedure a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference); override;
  91. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  92. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  93. size: tcgsize; a: tcgint; src, dst: tregister); override;
  94. procedure a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  95. size: tcgsize; src1, src2, dst: tregister); override;
  96. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  97. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  98. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  99. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  100. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  101. {Multiply two 32-bit registers into lo and hi 32-bit registers}
  102. procedure a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister); override;
  103. end;
  104. { normal arm cg }
  105. tarmcgarm = class(tcgarm)
  106. procedure init_register_allocators;override;
  107. procedure done_register_allocators;override;
  108. end;
  109. { 64 bit cg for all arm flavours }
  110. tbasecg64farm = class(tcg64f32)
  111. end;
  112. { tcg64farm is shared between normal arm and thumb-2 }
  113. tcg64farm = class(tbasecg64farm)
  114. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  115. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  116. procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;
  117. procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
  118. procedure a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  119. procedure a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  120. procedure a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);override;
  121. procedure a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);override;
  122. end;
  123. tarmcg64farm = class(tcg64farm)
  124. end;
  125. tthumbcgarm = class(tbasecgarm)
  126. procedure init_register_allocators;override;
  127. procedure done_register_allocators;override;
  128. procedure g_proc_entry(list: TAsmList; localsize: longint; nostackframe: boolean);override;
  129. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  130. procedure a_op_reg_reg(list: TAsmList; Op: TOpCG; size: TCGSize; src,dst: TRegister);override;
  131. procedure a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);override;
  132. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister); override;
  133. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  134. procedure a_load_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const Ref: treference; reg: tregister);override;
  135. procedure a_load_const_reg(list: TAsmList; size: tcgsize; a: tcgint; reg: tregister);override;
  136. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  137. function handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference; override;
  138. end;
  139. tthumbcg64farm = class(tbasecg64farm)
  140. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  141. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  142. end;
  143. tthumb2cgarm = class(tcgarm)
  144. procedure init_register_allocators;override;
  145. procedure done_register_allocators;override;
  146. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  147. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  148. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  149. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  150. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  151. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  152. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  153. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  154. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  155. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; override;
  156. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  157. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  158. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  159. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  160. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  161. end;
  162. tthumb2cg64farm = class(tcg64farm)
  163. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  164. end;
  165. const
  166. OpCmp2AsmCond : Array[topcmp] of TAsmCond = (C_NONE,C_EQ,C_GT,
  167. C_LT,C_GE,C_LE,C_NE,C_LS,C_CC,C_CS,C_HI);
  168. winstackpagesize = 4096;
  169. function get_fpu_postfix(def : tdef) : toppostfix;
  170. procedure create_codegen;
  171. implementation
  172. uses
  173. globals,verbose,systems,cutils,
  174. aopt,aoptcpu,
  175. fmodule,
  176. symconst,symsym,symtable,
  177. tgobj,
  178. procinfo,cpupi,
  179. paramgr;
  180. function get_fpu_postfix(def : tdef) : toppostfix;
  181. begin
  182. if def.typ=floatdef then
  183. begin
  184. case tfloatdef(def).floattype of
  185. s32real:
  186. result:=PF_S;
  187. s64real:
  188. result:=PF_D;
  189. s80real:
  190. result:=PF_E;
  191. else
  192. internalerror(200401272);
  193. end;
  194. end
  195. else
  196. internalerror(200401271);
  197. end;
  198. procedure tarmcgarm.init_register_allocators;
  199. begin
  200. inherited init_register_allocators;
  201. { currently, we always save R14, so we can use it }
  202. if (target_info.system<>system_arm_darwin) then
  203. begin
  204. if assigned(current_procinfo) and (current_procinfo.framepointer<>NR_R11) then
  205. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  206. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  207. RS_R9,RS_R10,RS_R11,RS_R14],first_int_imreg,[])
  208. else
  209. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  210. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  211. RS_R9,RS_R10,RS_R14],first_int_imreg,[])
  212. end
  213. else
  214. { r7 is not available on Darwin, it's used as frame pointer (always,
  215. for backtrace support -- also in gcc/clang -> R11 can be used).
  216. r9 is volatile }
  217. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  218. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R9,RS_R12,RS_R4,RS_R5,RS_R6,RS_R8,
  219. RS_R10,RS_R11,RS_R14],first_int_imreg,[]);
  220. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  221. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  222. { The register allocator currently cannot deal with multiple
  223. non-overlapping subregs per register, so we can only use
  224. half the single precision registers for now (as sub registers of the
  225. double precision ones). }
  226. if current_settings.fputype in [fpu_vfpv3,fpu_vfpv4] then
  227. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  228. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  229. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  230. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  231. ],first_mm_imreg,[])
  232. else
  233. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  234. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15],first_mm_imreg,[]);
  235. end;
  236. procedure tarmcgarm.done_register_allocators;
  237. begin
  238. rg[R_INTREGISTER].free;
  239. rg[R_FPUREGISTER].free;
  240. rg[R_MMREGISTER].free;
  241. inherited done_register_allocators;
  242. end;
  243. procedure tcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  244. var
  245. imm_shift : byte;
  246. l : tasmlabel;
  247. hr : treference;
  248. imm1, imm2: DWord;
  249. begin
  250. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  251. internalerror(2002090902);
  252. if is_shifter_const(a,imm_shift) then
  253. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  254. else if is_shifter_const(not(a),imm_shift) then
  255. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  256. { loading of constants with mov and orr }
  257. else if (split_into_shifter_const(a,imm1, imm2)) then
  258. begin
  259. list.concat(taicpu.op_reg_const(A_MOV,reg, imm1));
  260. list.concat(taicpu.op_reg_reg_const(A_ORR,reg,reg, imm2));
  261. end
  262. { loading of constants with mvn and bic }
  263. else if (split_into_shifter_const(not(a), imm1, imm2)) then
  264. begin
  265. list.concat(taicpu.op_reg_const(A_MVN,reg, imm1));
  266. list.concat(taicpu.op_reg_reg_const(A_BIC,reg,reg, imm2));
  267. end
  268. else
  269. begin
  270. reference_reset(hr,4,[]);
  271. current_asmdata.getjumplabel(l);
  272. cg.a_label(current_procinfo.aktlocaldata,l);
  273. hr.symboldata:=current_procinfo.aktlocaldata.last;
  274. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  275. hr.symbol:=l;
  276. hr.base:=NR_PC;
  277. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  278. end;
  279. end;
  280. procedure tcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  281. var
  282. oppostfix:toppostfix;
  283. usedtmpref: treference;
  284. tmpreg,tmpreg2 : tregister;
  285. so : tshifterop;
  286. dir : integer;
  287. begin
  288. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  289. FromSize := ToSize;
  290. case FromSize of
  291. { signed integer registers }
  292. OS_8:
  293. oppostfix:=PF_B;
  294. OS_S8:
  295. oppostfix:=PF_SB;
  296. OS_16:
  297. oppostfix:=PF_H;
  298. OS_S16:
  299. oppostfix:=PF_SH;
  300. OS_32,
  301. OS_S32:
  302. oppostfix:=PF_None;
  303. else
  304. InternalError(200308297);
  305. end;
  306. if (fromsize=OS_S8) and
  307. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  308. oppostfix:=PF_B;
  309. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize])) or
  310. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  311. (oppostfix in [PF_SH,PF_H])) then
  312. begin
  313. if target_info.endian=endian_big then
  314. dir:=-1
  315. else
  316. dir:=1;
  317. case FromSize of
  318. OS_16,OS_S16:
  319. begin
  320. { only complicated references need an extra loadaddr }
  321. if assigned(ref.symbol) or
  322. (ref.index<>NR_NO) or
  323. (ref.offset<-4095) or
  324. (ref.offset>4094) or
  325. { sometimes the compiler reused registers }
  326. (reg=ref.index) or
  327. (reg=ref.base) then
  328. begin
  329. tmpreg2:=getintregister(list,OS_INT);
  330. a_loadaddr_ref_reg(list,ref,tmpreg2);
  331. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment,ref.volatility);
  332. end
  333. else
  334. usedtmpref:=ref;
  335. if target_info.endian=endian_big then
  336. inc(usedtmpref.offset,1);
  337. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  338. tmpreg:=getintregister(list,OS_INT);
  339. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  340. inc(usedtmpref.offset,dir);
  341. if FromSize=OS_16 then
  342. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  343. else
  344. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  345. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  346. end;
  347. OS_32,OS_S32:
  348. begin
  349. tmpreg:=getintregister(list,OS_INT);
  350. { only complicated references need an extra loadaddr }
  351. if assigned(ref.symbol) or
  352. (ref.index<>NR_NO) or
  353. (ref.offset<-4095) or
  354. (ref.offset>4092) or
  355. { sometimes the compiler reused registers }
  356. (reg=ref.index) or
  357. (reg=ref.base) then
  358. begin
  359. tmpreg2:=getintregister(list,OS_INT);
  360. a_loadaddr_ref_reg(list,ref,tmpreg2);
  361. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment,ref.volatility);
  362. end
  363. else
  364. usedtmpref:=ref;
  365. shifterop_reset(so);so.shiftmode:=SM_LSL;
  366. if ref.alignment=2 then
  367. begin
  368. if target_info.endian=endian_big then
  369. inc(usedtmpref.offset,2);
  370. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  371. inc(usedtmpref.offset,dir*2);
  372. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  373. so.shiftimm:=16;
  374. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  375. end
  376. else
  377. begin
  378. tmpreg2:=getintregister(list,OS_INT);
  379. if target_info.endian=endian_big then
  380. inc(usedtmpref.offset,3);
  381. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  382. inc(usedtmpref.offset,dir);
  383. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  384. inc(usedtmpref.offset,dir);
  385. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg2);
  386. so.shiftimm:=8;
  387. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  388. inc(usedtmpref.offset,dir);
  389. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  390. so.shiftimm:=16;
  391. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg2,so));
  392. so.shiftimm:=24;
  393. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  394. end;
  395. end
  396. else
  397. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  398. end;
  399. end
  400. else
  401. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  402. if (fromsize=OS_S8) and
  403. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  404. a_load_reg_reg(list,OS_S8,OS_32,reg,reg)
  405. else if (fromsize=OS_S8) and (tosize = OS_16) then
  406. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  407. end;
  408. procedure tcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  409. var
  410. hsym : tsym;
  411. href : treference;
  412. paraloc : Pcgparalocation;
  413. shift : byte;
  414. begin
  415. { calculate the parameter info for the procdef }
  416. procdef.init_paraloc_info(callerside);
  417. hsym:=tsym(procdef.parast.Find('self'));
  418. if not(assigned(hsym) and
  419. (hsym.typ=paravarsym)) then
  420. internalerror(200305251);
  421. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  422. while paraloc<>nil do
  423. with paraloc^ do
  424. begin
  425. case loc of
  426. LOC_REGISTER:
  427. begin
  428. if is_shifter_const(ioffset,shift) then
  429. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  430. else
  431. begin
  432. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  433. a_op_reg_reg(list,OP_SUB,size,NR_R12,register);
  434. end;
  435. end;
  436. LOC_REFERENCE:
  437. begin
  438. { offset in the wrapper needs to be adjusted for the stored
  439. return address }
  440. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),sizeof(pint),[]);
  441. if is_shifter_const(ioffset,shift) then
  442. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  443. else
  444. begin
  445. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  446. a_op_reg_ref(list,OP_SUB,size,NR_R12,href);
  447. end;
  448. end
  449. else
  450. internalerror(200309189);
  451. end;
  452. paraloc:=next;
  453. end;
  454. end;
  455. procedure tbasecgarm.a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);
  456. var
  457. ref: treference;
  458. begin
  459. paraloc.check_simple_location;
  460. paramanager.allocparaloc(list,paraloc.location);
  461. case paraloc.location^.loc of
  462. LOC_REGISTER,LOC_CREGISTER:
  463. a_load_const_reg(list,size,a,paraloc.location^.register);
  464. LOC_REFERENCE:
  465. begin
  466. reference_reset(ref,paraloc.alignment,[]);
  467. ref.base:=paraloc.location^.reference.index;
  468. ref.offset:=paraloc.location^.reference.offset;
  469. a_load_const_ref(list,size,a,ref);
  470. end;
  471. else
  472. internalerror(2002081101);
  473. end;
  474. end;
  475. procedure tbasecgarm.a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);
  476. var
  477. tmpref, ref: treference;
  478. location: pcgparalocation;
  479. sizeleft: aint;
  480. begin
  481. location := paraloc.location;
  482. tmpref := r;
  483. sizeleft := paraloc.intsize;
  484. while assigned(location) do
  485. begin
  486. paramanager.allocparaloc(list,location);
  487. case location^.loc of
  488. LOC_REGISTER,LOC_CREGISTER:
  489. a_load_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  490. LOC_REFERENCE:
  491. begin
  492. reference_reset_base(ref,location^.reference.index,location^.reference.offset,paraloc.alignment,[]);
  493. { doubles in softemu mode have a strange order of registers and references }
  494. if location^.size=OS_32 then
  495. g_concatcopy(list,tmpref,ref,4)
  496. else
  497. begin
  498. g_concatcopy(list,tmpref,ref,sizeleft);
  499. if assigned(location^.next) then
  500. internalerror(2005010710);
  501. end;
  502. end;
  503. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  504. case location^.size of
  505. OS_F32, OS_F64:
  506. a_loadfpu_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  507. else
  508. internalerror(2002072801);
  509. end;
  510. LOC_VOID:
  511. begin
  512. // nothing to do
  513. end;
  514. else
  515. internalerror(2002081103);
  516. end;
  517. inc(tmpref.offset,tcgsize2size[location^.size]);
  518. dec(sizeleft,tcgsize2size[location^.size]);
  519. location := location^.next;
  520. end;
  521. end;
  522. procedure tbasecgarm.a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);
  523. var
  524. ref: treference;
  525. tmpreg: tregister;
  526. begin
  527. paraloc.check_simple_location;
  528. paramanager.allocparaloc(list,paraloc.location);
  529. case paraloc.location^.loc of
  530. LOC_REGISTER,LOC_CREGISTER:
  531. a_loadaddr_ref_reg(list,r,paraloc.location^.register);
  532. LOC_REFERENCE:
  533. begin
  534. reference_reset(ref,paraloc.alignment,[]);
  535. ref.base := paraloc.location^.reference.index;
  536. ref.offset := paraloc.location^.reference.offset;
  537. tmpreg := getintregister(list,OS_ADDR);
  538. a_loadaddr_ref_reg(list,r,tmpreg);
  539. a_load_reg_ref(list,OS_ADDR,OS_ADDR,tmpreg,ref);
  540. end;
  541. else
  542. internalerror(2002080701);
  543. end;
  544. end;
  545. procedure tbasecgarm.a_call_name(list : TAsmList;const s : string; weak: boolean);
  546. var
  547. branchopcode: tasmop;
  548. r : treference;
  549. sym : TAsmSymbol;
  550. begin
  551. { use always BL as newer binutils do not translate blx apparently
  552. generating BL is also what clang and gcc do by default }
  553. branchopcode:=A_BL;
  554. if not(weak) then
  555. sym:=current_asmdata.RefAsmSymbol(s,AT_FUNCTION)
  556. else
  557. sym:=current_asmdata.WeakRefAsmSymbol(s,AT_FUNCTION);
  558. reference_reset_symbol(r,sym,0,sizeof(pint),[]);
  559. if (tf_pic_uses_got in target_info.flags) and
  560. (cs_create_pic in current_settings.moduleswitches) then
  561. begin
  562. r.refaddr:=addr_pic
  563. end
  564. else
  565. r.refaddr:=addr_full;
  566. list.concat(taicpu.op_ref(branchopcode,r));
  567. {
  568. the compiler does not properly set this flag anymore in pass 1, and
  569. for now we only need it after pass 2 (I hope) (JM)
  570. if not(pi_do_call in current_procinfo.flags) then
  571. internalerror(2003060703);
  572. }
  573. include(current_procinfo.flags,pi_do_call);
  574. end;
  575. procedure tbasecgarm.a_call_reg(list : TAsmList;reg: tregister);
  576. begin
  577. { check not really correct: should only be used for non-Thumb cpus }
  578. if not(CPUARM_HAS_BLX in cpu_capabilities[current_settings.cputype]) then
  579. begin
  580. list.concat(taicpu.op_reg_reg(A_MOV,NR_R14,NR_PC));
  581. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,reg));
  582. end
  583. else
  584. list.concat(taicpu.op_reg(A_BLX, reg));
  585. {
  586. the compiler does not properly set this flag anymore in pass 1, and
  587. for now we only need it after pass 2 (I hope) (JM)
  588. if not(pi_do_call in current_procinfo.flags) then
  589. internalerror(2003060703);
  590. }
  591. include(current_procinfo.flags,pi_do_call);
  592. end;
  593. procedure tcgarm.a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister);
  594. begin
  595. a_op_const_reg_reg(list,op,size,a,reg,reg);
  596. end;
  597. procedure tcgarm.a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference);
  598. var
  599. tmpreg,tmpresreg : tregister;
  600. tmpref : treference;
  601. begin
  602. tmpreg:=getintregister(list,size);
  603. tmpresreg:=getintregister(list,size);
  604. tmpref:=a_internal_load_ref_reg(list,size,size,ref,tmpreg);
  605. a_op_const_reg_reg(list,op,size,a,tmpreg,tmpresreg);
  606. a_load_reg_ref(list,size,size,tmpresreg,tmpref);
  607. end;
  608. procedure tcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  609. var
  610. so : tshifterop;
  611. begin
  612. if op = OP_NEG then
  613. begin
  614. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,src,0));
  615. maybeadjustresult(list,OP_NEG,size,dst);
  616. end
  617. else if op = OP_NOT then
  618. begin
  619. if size in [OS_8, OS_16, OS_S8, OS_S16] then
  620. begin
  621. shifterop_reset(so);
  622. so.shiftmode:=SM_LSL;
  623. if size in [OS_8, OS_S8] then
  624. so.shiftimm:=24
  625. else
  626. so.shiftimm:=16;
  627. list.concat(taicpu.op_reg_reg_shifterop(A_MVN,dst,src,so));
  628. {Using a shift here allows this to be folded into another instruction}
  629. if size in [OS_S8, OS_S16] then
  630. so.shiftmode:=SM_ASR
  631. else
  632. so.shiftmode:=SM_LSR;
  633. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  634. end
  635. else
  636. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  637. end
  638. else
  639. a_op_reg_reg_reg(list,op,size,src,dst,dst);
  640. end;
  641. const
  642. op_reg_reg_opcg2asmop: array[TOpCG] of tasmop =
  643. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  644. A_NONE,A_NONE,A_NONE,A_SUB,A_EOR,A_NONE,A_NONE);
  645. op_reg_opcg2asmop: array[TOpCG] of tasmop =
  646. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  647. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  648. op_reg_postfix: array[TOpCG] of TOpPostfix =
  649. (PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,
  650. PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None);
  651. procedure tcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  652. size: tcgsize; a: tcgint; src, dst: tregister);
  653. var
  654. ovloc : tlocation;
  655. begin
  656. a_op_const_reg_reg_checkoverflow(list,op,size,a,src,dst,false,ovloc);
  657. end;
  658. procedure tcgarm.a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  659. size: tcgsize; src1, src2, dst: tregister);
  660. var
  661. ovloc : tlocation;
  662. begin
  663. a_op_reg_reg_reg_checkoverflow(list,op,size,src1,src2,dst,false,ovloc);
  664. end;
  665. function opshift2shiftmode(op: TOpCg): tshiftmode;
  666. begin
  667. case op of
  668. OP_SHL: Result:=SM_LSL;
  669. OP_SHR: Result:=SM_LSR;
  670. OP_ROR: Result:=SM_ROR;
  671. OP_ROL: Result:=SM_ROR;
  672. OP_SAR: Result:=SM_ASR;
  673. else internalerror(2012070501);
  674. end
  675. end;
  676. function tbasecgarm.try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  677. var
  678. multiplier : dword;
  679. power : longint;
  680. shifterop : tshifterop;
  681. bitsset : byte;
  682. negative : boolean;
  683. first : boolean;
  684. b,
  685. cycles : byte;
  686. maxeffort : byte;
  687. begin
  688. result:=true;
  689. cycles:=0;
  690. negative:=a<0;
  691. shifterop.rs:=NR_NO;
  692. shifterop.shiftmode:=SM_LSL;
  693. if negative then
  694. inc(cycles);
  695. multiplier:=dword(abs(a));
  696. bitsset:=popcnt(multiplier and $fffffffe);
  697. { heuristics to estimate how much instructions are reasonable to replace the mul,
  698. this is currently based on XScale timings }
  699. { in the simplest case, we need a mov to load the constant and a mul to carry out the
  700. actual multiplication, this requires min. 1+4 cycles
  701. because the first shift imm. might cause a stall and because we need more instructions
  702. when replacing the mul we generate max. 3 instructions to replace this mul }
  703. maxeffort:=3;
  704. { if the constant is not a shifter op, we need either some mov/mvn/bic/or sequence or
  705. a ldr, so generating one more operation to replace this is beneficial }
  706. if not(is_shifter_const(dword(a),b)) and not(is_shifter_const(not(dword(a)),b)) then
  707. inc(maxeffort);
  708. { if the upper 5 bits are all set or clear, mul is one cycle faster }
  709. if ((dword(a) and $f8000000)=0) or ((dword(a) and $f8000000)=$f8000000) then
  710. dec(maxeffort);
  711. { if the upper 17 bits are all set or clear, mul is another cycle faster }
  712. if ((dword(a) and $ffff8000)=0) or ((dword(a) and $ffff8000)=$ffff8000) then
  713. dec(maxeffort);
  714. { most simple cases }
  715. if a=1 then
  716. a_load_reg_reg(list,OS_32,OS_32,src,dst)
  717. else if a=0 then
  718. a_load_const_reg(list,OS_32,0,dst)
  719. else if a=-1 then
  720. a_op_reg_reg(list,OP_NEG,OS_32,src,dst)
  721. { add up ?
  722. basically, one add is needed for each bit being set in the constant factor
  723. however, the least significant bit is for free, it can be hidden in the initial
  724. instruction
  725. }
  726. else if (bitsset+cycles<=maxeffort) and
  727. (bitsset<=popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)) then
  728. begin
  729. first:=true;
  730. while multiplier<>0 do
  731. begin
  732. shifterop.shiftimm:=BsrDWord(multiplier);
  733. if odd(multiplier) then
  734. begin
  735. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,shifterop));
  736. dec(multiplier);
  737. end
  738. else
  739. if first then
  740. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  741. else
  742. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,src,shifterop));
  743. first:=false;
  744. dec(multiplier,1 shl shifterop.shiftimm);
  745. end;
  746. if negative then
  747. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  748. end
  749. { subtract from the next greater power of two? }
  750. else if popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)+cycles+1<=maxeffort then
  751. begin
  752. first:=true;
  753. while multiplier<>0 do
  754. begin
  755. if first then
  756. begin
  757. multiplier:=(1 shl power)-multiplier;
  758. shifterop.shiftimm:=power;
  759. end
  760. else
  761. shifterop.shiftimm:=BsrDWord(multiplier);
  762. if odd(multiplier) then
  763. begin
  764. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,shifterop));
  765. dec(multiplier);
  766. end
  767. else
  768. if first then
  769. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  770. else
  771. begin
  772. list.concat(taicpu.op_reg_reg_reg_shifterop(A_SUB,dst,dst,src,shifterop));
  773. dec(multiplier,1 shl shifterop.shiftimm);
  774. end;
  775. first:=false;
  776. end;
  777. if negative then
  778. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  779. end
  780. else
  781. result:=false;
  782. end;
  783. procedure tcgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  784. var
  785. shift, lsb, width : byte;
  786. tmpreg : tregister;
  787. so : tshifterop;
  788. l1 : longint;
  789. imm1, imm2: DWord;
  790. begin
  791. optimize_op_const(size, op, a);
  792. case op of
  793. OP_NONE:
  794. begin
  795. if src <> dst then
  796. a_load_reg_reg(list, size, size, src, dst);
  797. exit;
  798. end;
  799. OP_MOVE:
  800. begin
  801. a_load_const_reg(list, size, a, dst);
  802. exit;
  803. end;
  804. end;
  805. ovloc.loc:=LOC_VOID;
  806. if {$ifopt R+}(a<>-2147483648) and{$endif} not setflags and is_shifter_const(-a,shift) then
  807. case op of
  808. OP_ADD:
  809. begin
  810. op:=OP_SUB;
  811. a:=aint(dword(-a));
  812. end;
  813. OP_SUB:
  814. begin
  815. op:=OP_ADD;
  816. a:=aint(dword(-a));
  817. end
  818. end;
  819. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  820. case op of
  821. OP_NEG,OP_NOT:
  822. internalerror(200308281);
  823. OP_SHL,
  824. OP_SHR,
  825. OP_ROL,
  826. OP_ROR,
  827. OP_SAR:
  828. begin
  829. if a>32 then
  830. internalerror(200308294);
  831. shifterop_reset(so);
  832. so.shiftmode:=opshift2shiftmode(op);
  833. if op = OP_ROL then
  834. so.shiftimm:=32-a
  835. else
  836. so.shiftimm:=a;
  837. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  838. end;
  839. else
  840. {if (op in [OP_SUB, OP_ADD]) and
  841. ((a < 0) or
  842. (a > 4095)) then
  843. begin
  844. tmpreg:=getintregister(list,size);
  845. list.concat(taicpu.op_reg_const(A_MOVT, tmpreg, (a shr 16) and $FFFF));
  846. list.concat(taicpu.op_reg_const(A_MOV, tmpreg, a and $FFFF));
  847. list.concat(setoppostfix(taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))
  848. ));
  849. end
  850. else}
  851. begin
  852. if cgsetflags or setflags then
  853. a_reg_alloc(list,NR_DEFAULTFLAGS);
  854. list.concat(setoppostfix(
  855. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  856. end;
  857. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  858. begin
  859. ovloc.loc:=LOC_FLAGS;
  860. case op of
  861. OP_ADD:
  862. ovloc.resflags:=F_CS;
  863. OP_SUB:
  864. ovloc.resflags:=F_CC;
  865. end;
  866. end;
  867. end
  868. else
  869. begin
  870. { there could be added some more sophisticated optimizations }
  871. if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  872. a_op_reg_reg(list,OP_NEG,size,src,dst)
  873. { we do this here instead in the peephole optimizer because
  874. it saves us a register }
  875. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  876. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  877. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  878. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  879. begin
  880. if l1>32 then{roozbeh does this ever happen?}
  881. internalerror(200308296);
  882. shifterop_reset(so);
  883. so.shiftmode:=SM_LSL;
  884. so.shiftimm:=l1;
  885. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  886. end
  887. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  888. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  889. begin
  890. if l1>32 then{does this ever happen?}
  891. internalerror(201205181);
  892. shifterop_reset(so);
  893. so.shiftmode:=SM_LSL;
  894. so.shiftimm:=l1;
  895. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  896. end
  897. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  898. begin
  899. { nothing to do on success }
  900. end
  901. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  902. broader range of shifterconstants.}
  903. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  904. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  905. { Doing two shifts instead of two bics might allow the peephole optimizer to fold the second shift
  906. into the following instruction}
  907. else if (op = OP_AND) and
  908. is_continuous_mask(a, lsb, width) and
  909. ((lsb = 0) or ((lsb + width) = 32)) then
  910. begin
  911. shifterop_reset(so);
  912. if (width = 16) and
  913. (lsb = 0) and
  914. (current_settings.cputype >= cpu_armv6) then
  915. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  916. else if (width = 8) and
  917. (lsb = 0) and
  918. (current_settings.cputype >= cpu_armv6) then
  919. list.concat(taicpu.op_reg_reg(A_UXTB,dst,src))
  920. else if lsb = 0 then
  921. begin
  922. so.shiftmode:=SM_LSL;
  923. so.shiftimm:=32-width;
  924. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  925. so.shiftmode:=SM_LSR;
  926. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  927. end
  928. else
  929. begin
  930. so.shiftmode:=SM_LSR;
  931. so.shiftimm:=lsb;
  932. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  933. so.shiftmode:=SM_LSL;
  934. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  935. end;
  936. end
  937. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  938. begin
  939. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,imm1));
  940. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  941. end
  942. else if (op in [OP_ADD, OP_SUB, OP_OR, OP_XOR]) and
  943. not(cgsetflags or setflags) and
  944. split_into_shifter_const(a, imm1, imm2) then
  945. begin
  946. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,imm1));
  947. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  948. end
  949. else
  950. begin
  951. tmpreg:=getintregister(list,size);
  952. a_load_const_reg(list,size,a,tmpreg);
  953. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  954. end;
  955. end;
  956. maybeadjustresult(list,op,size,dst);
  957. end;
  958. procedure tcgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  959. var
  960. so : tshifterop;
  961. tmpreg,overflowreg : tregister;
  962. asmop : tasmop;
  963. begin
  964. ovloc.loc:=LOC_VOID;
  965. case op of
  966. OP_NEG,OP_NOT,
  967. OP_DIV,OP_IDIV:
  968. internalerror(200308283);
  969. OP_SHL,
  970. OP_SHR,
  971. OP_SAR,
  972. OP_ROR:
  973. begin
  974. if (op = OP_ROR) and not(size in [OS_32,OS_S32]) then
  975. internalerror(2008072801);
  976. shifterop_reset(so);
  977. so.rs:=src1;
  978. so.shiftmode:=opshift2shiftmode(op);
  979. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  980. end;
  981. OP_ROL:
  982. begin
  983. if not(size in [OS_32,OS_S32]) then
  984. internalerror(2008072801);
  985. { simulate ROL by ror'ing 32-value }
  986. tmpreg:=getintregister(list,OS_32);
  987. list.concat(taicpu.op_reg_reg_const(A_RSB,tmpreg,src1, 32));
  988. shifterop_reset(so);
  989. so.rs:=tmpreg;
  990. so.shiftmode:=SM_ROR;
  991. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  992. end;
  993. OP_IMUL,
  994. OP_MUL:
  995. begin
  996. if (cgsetflags or setflags) and
  997. (CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype]) then
  998. begin
  999. overflowreg:=getintregister(list,size);
  1000. if op=OP_IMUL then
  1001. asmop:=A_SMULL
  1002. else
  1003. asmop:=A_UMULL;
  1004. { the arm doesn't allow that rd and rm are the same }
  1005. if dst=src2 then
  1006. begin
  1007. if dst<>src1 then
  1008. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  1009. else
  1010. begin
  1011. tmpreg:=getintregister(list,size);
  1012. a_load_reg_reg(list,size,size,src2,dst);
  1013. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  1014. end;
  1015. end
  1016. else
  1017. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  1018. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1019. if op=OP_IMUL then
  1020. begin
  1021. shifterop_reset(so);
  1022. so.shiftmode:=SM_ASR;
  1023. so.shiftimm:=31;
  1024. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  1025. end
  1026. else
  1027. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  1028. ovloc.loc:=LOC_FLAGS;
  1029. ovloc.resflags:=F_NE;
  1030. end
  1031. else
  1032. begin
  1033. { the arm doesn't allow that rd and rm are the same }
  1034. if dst=src2 then
  1035. begin
  1036. if dst<>src1 then
  1037. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  1038. else
  1039. begin
  1040. tmpreg:=getintregister(list,size);
  1041. a_load_reg_reg(list,size,size,src2,dst);
  1042. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  1043. end;
  1044. end
  1045. else
  1046. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  1047. end;
  1048. end;
  1049. else
  1050. begin
  1051. if cgsetflags or setflags then
  1052. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1053. list.concat(setoppostfix(
  1054. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  1055. end;
  1056. end;
  1057. maybeadjustresult(list,op,size,dst);
  1058. end;
  1059. procedure tcgarm.a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister);
  1060. var
  1061. asmop: tasmop;
  1062. begin
  1063. if CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype] then
  1064. begin
  1065. list.concat(tai_comment.create(strpnew('tcgarm.a_mul_reg_reg_pair called')));
  1066. case size of
  1067. OS_32: asmop:=A_UMULL;
  1068. OS_S32: asmop:=A_SMULL;
  1069. else
  1070. InternalError(2014060802);
  1071. end;
  1072. { The caller might omit dstlo or dsthi, when he is not interested in it, we still
  1073. need valid registers everywhere. In case of dsthi = NR_NO we could fall back to
  1074. 32x32=32 bit multiplication}
  1075. if (dstlo = NR_NO) then
  1076. dstlo:=getintregister(list,size);
  1077. if (dsthi = NR_NO) then
  1078. dsthi:=getintregister(list,size);
  1079. list.concat(taicpu.op_reg_reg_reg_reg(asmop, dstlo, dsthi, src1,src2));
  1080. end
  1081. else if dsthi=NR_NO then
  1082. begin
  1083. if (dstlo = NR_NO) then
  1084. dstlo:=getintregister(list,size);
  1085. list.concat(taicpu.op_reg_reg_reg(A_MUL, dstlo, src1,src2));
  1086. end
  1087. else
  1088. begin
  1089. internalerror(2015083022);
  1090. end;
  1091. end;
  1092. function tbasecgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  1093. var
  1094. tmpreg1,tmpreg2 : tregister;
  1095. begin
  1096. tmpreg1:=NR_NO;
  1097. { Be sure to have a base register }
  1098. if (ref.base=NR_NO) then
  1099. begin
  1100. if ref.shiftmode<>SM_None then
  1101. internalerror(2014020701);
  1102. ref.base:=ref.index;
  1103. ref.index:=NR_NO;
  1104. end;
  1105. { absolute symbols can't be handled directly, we've to store the symbol reference
  1106. in the text segment and access it pc relative
  1107. For now, we assume that references where base or index equals to PC are already
  1108. relative, all other references are assumed to be absolute and thus they need
  1109. to be handled extra.
  1110. A proper solution would be to change refoptions to a set and store the information
  1111. if the symbol is absolute or relative there.
  1112. }
  1113. if (assigned(ref.symbol) and
  1114. not(is_pc(ref.base)) and
  1115. not(is_pc(ref.index))
  1116. ) or
  1117. { [#xxx] isn't a valid address operand }
  1118. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  1119. (ref.offset<-4095) or
  1120. (ref.offset>4095) or
  1121. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  1122. ((ref.offset<-255) or
  1123. (ref.offset>255)
  1124. )
  1125. ) or
  1126. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1127. ((ref.offset<-1020) or
  1128. (ref.offset>1020) or
  1129. ((abs(ref.offset) mod 4)<>0)
  1130. )
  1131. ) or
  1132. ((GenerateThumbCode) and
  1133. (((oppostfix in [PF_SB,PF_SH]) and (ref.offset<>0)) or
  1134. ((oppostfix=PF_None) and ((ref.offset<0) or ((ref.base<>NR_STACK_POINTER_REG) and (ref.offset>124)) or
  1135. ((ref.base=NR_STACK_POINTER_REG) and (ref.offset>1020)) or ((ref.offset mod 4)<>0))) or
  1136. ((oppostfix=PF_H) and ((ref.offset<0) or (ref.offset>62) or ((ref.offset mod 2)<>0) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0)))) or
  1137. ((oppostfix=PF_B) and ((ref.offset<0) or (ref.offset>31) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0))))
  1138. )
  1139. ) then
  1140. begin
  1141. fixref(list,ref);
  1142. end;
  1143. if GenerateThumbCode then
  1144. begin
  1145. { certain thumb load require base and index }
  1146. if (oppostfix in [PF_SB,PF_SH]) and
  1147. (ref.base<>NR_NO) and (ref.index=NR_NO) then
  1148. begin
  1149. tmpreg1:=getintregister(list,OS_ADDR);
  1150. a_load_const_reg(list,OS_ADDR,0,tmpreg1);
  1151. ref.index:=tmpreg1;
  1152. end;
  1153. { "hi" registers cannot be used as base or index }
  1154. if (getsupreg(ref.base) in [RS_R8..RS_R12,RS_R14]) or
  1155. ((ref.base=NR_R13) and (ref.index<>NR_NO)) then
  1156. begin
  1157. tmpreg1:=getintregister(list,OS_ADDR);
  1158. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.base,tmpreg1);
  1159. ref.base:=tmpreg1;
  1160. end;
  1161. if getsupreg(ref.index) in [RS_R8..RS_R14] then
  1162. begin
  1163. tmpreg1:=getintregister(list,OS_ADDR);
  1164. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.index,tmpreg1);
  1165. ref.index:=tmpreg1;
  1166. end;
  1167. end;
  1168. { fold if there is base, index and offset, however, don't fold
  1169. for vfp memory instructions because we later fold the index }
  1170. if not((op in [A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1171. (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  1172. begin
  1173. if tmpreg1<>NR_NO then
  1174. begin
  1175. tmpreg2:=getintregister(list,OS_ADDR);
  1176. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg1,tmpreg2);
  1177. tmpreg1:=tmpreg2;
  1178. end
  1179. else
  1180. begin
  1181. tmpreg1:=getintregister(list,OS_ADDR);
  1182. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg1);
  1183. ref.base:=tmpreg1;
  1184. end;
  1185. ref.offset:=0;
  1186. end;
  1187. { floating point operations have only limited references
  1188. we expect here, that a base is already set }
  1189. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  1190. begin
  1191. if ref.shiftmode<>SM_none then
  1192. internalerror(200309121);
  1193. if tmpreg1<>NR_NO then
  1194. begin
  1195. if ref.base=tmpreg1 then
  1196. begin
  1197. if ref.signindex<0 then
  1198. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,tmpreg1,ref.index))
  1199. else
  1200. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,tmpreg1,ref.index));
  1201. ref.index:=NR_NO;
  1202. end
  1203. else
  1204. begin
  1205. if ref.index<>tmpreg1 then
  1206. internalerror(200403161);
  1207. if ref.signindex<0 then
  1208. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,ref.base,tmpreg1))
  1209. else
  1210. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,tmpreg1));
  1211. ref.base:=tmpreg1;
  1212. ref.index:=NR_NO;
  1213. end;
  1214. end
  1215. else
  1216. begin
  1217. tmpreg1:=getintregister(list,OS_ADDR);
  1218. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,ref.index));
  1219. ref.base:=tmpreg1;
  1220. ref.index:=NR_NO;
  1221. end;
  1222. end;
  1223. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  1224. Result := ref;
  1225. end;
  1226. procedure tbasecgarm.a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);
  1227. var
  1228. oppostfix:toppostfix;
  1229. usedtmpref: treference;
  1230. tmpreg : tregister;
  1231. dir : integer;
  1232. begin
  1233. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  1234. FromSize := ToSize;
  1235. case ToSize of
  1236. { signed integer registers }
  1237. OS_8,
  1238. OS_S8:
  1239. oppostfix:=PF_B;
  1240. OS_16,
  1241. OS_S16:
  1242. oppostfix:=PF_H;
  1243. OS_32,
  1244. OS_S32,
  1245. { for vfp value stored in integer register }
  1246. OS_F32:
  1247. oppostfix:=PF_None;
  1248. else
  1249. InternalError(200308299);
  1250. end;
  1251. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[tosize])) or
  1252. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  1253. (oppostfix =PF_H)) then
  1254. begin
  1255. if target_info.endian=endian_big then
  1256. dir:=-1
  1257. else
  1258. dir:=1;
  1259. case FromSize of
  1260. OS_16,OS_S16:
  1261. begin
  1262. tmpreg:=getintregister(list,OS_INT);
  1263. usedtmpref:=ref;
  1264. if target_info.endian=endian_big then
  1265. inc(usedtmpref.offset,1);
  1266. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1267. inc(usedtmpref.offset,dir);
  1268. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1269. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1270. end;
  1271. OS_32,OS_S32:
  1272. begin
  1273. tmpreg:=getintregister(list,OS_INT);
  1274. usedtmpref:=ref;
  1275. if ref.alignment=2 then
  1276. begin
  1277. if target_info.endian=endian_big then
  1278. inc(usedtmpref.offset,2);
  1279. usedtmpref:=a_internal_load_reg_ref(list,OS_16,OS_16,reg,usedtmpref);
  1280. a_op_const_reg_reg(list,OP_SHR,OS_INT,16,reg,tmpreg);
  1281. inc(usedtmpref.offset,dir*2);
  1282. a_internal_load_reg_ref(list,OS_16,OS_16,tmpreg,usedtmpref);
  1283. end
  1284. else
  1285. begin
  1286. if target_info.endian=endian_big then
  1287. inc(usedtmpref.offset,3);
  1288. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1289. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1290. inc(usedtmpref.offset,dir);
  1291. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1292. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1293. inc(usedtmpref.offset,dir);
  1294. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1295. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1296. inc(usedtmpref.offset,dir);
  1297. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1298. end;
  1299. end
  1300. else
  1301. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1302. end;
  1303. end
  1304. else
  1305. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1306. end;
  1307. function tbasecgarm.a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  1308. var
  1309. oppostfix:toppostfix;
  1310. href: treference;
  1311. tmpreg: TRegister;
  1312. begin
  1313. case ToSize of
  1314. { signed integer registers }
  1315. OS_8,
  1316. OS_S8:
  1317. oppostfix:=PF_B;
  1318. OS_16,
  1319. OS_S16:
  1320. oppostfix:=PF_H;
  1321. OS_32,
  1322. OS_S32:
  1323. oppostfix:=PF_None;
  1324. else
  1325. InternalError(2003082910);
  1326. end;
  1327. if (tosize in [OS_S16,OS_16]) and
  1328. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1329. begin
  1330. result:=handle_load_store(list,A_STR,PF_B,reg,ref);
  1331. tmpreg:=getintregister(list,OS_INT);
  1332. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1333. href:=result;
  1334. inc(href.offset);
  1335. handle_load_store(list,A_STR,PF_B,tmpreg,href);
  1336. end
  1337. else
  1338. result:=handle_load_store(list,A_STR,oppostfix,reg,ref);
  1339. end;
  1340. function tbasecgarm.a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  1341. var
  1342. oppostfix:toppostfix;
  1343. so: tshifterop;
  1344. tmpreg: TRegister;
  1345. href: treference;
  1346. begin
  1347. case FromSize of
  1348. { signed integer registers }
  1349. OS_8:
  1350. oppostfix:=PF_B;
  1351. OS_S8:
  1352. oppostfix:=PF_SB;
  1353. OS_16:
  1354. oppostfix:=PF_H;
  1355. OS_S16:
  1356. oppostfix:=PF_SH;
  1357. OS_32,
  1358. OS_S32:
  1359. oppostfix:=PF_None;
  1360. else
  1361. InternalError(200308291);
  1362. end;
  1363. if (tosize=OS_S8) and
  1364. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1365. begin
  1366. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1367. a_load_reg_reg(list,OS_S8,OS_32,reg,reg);
  1368. end
  1369. else if (tosize in [OS_S16,OS_16]) and
  1370. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1371. begin
  1372. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1373. tmpreg:=getintregister(list,OS_INT);
  1374. href:=result;
  1375. inc(href.offset);
  1376. handle_load_store(list,A_LDR,PF_B,tmpreg,href);
  1377. shifterop_reset(so);
  1378. so.shiftmode:=SM_LSL;
  1379. so.shiftimm:=8;
  1380. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  1381. end
  1382. else
  1383. result:=handle_load_store(list,A_LDR,oppostfix,reg,ref);
  1384. end;
  1385. procedure tbasecgarm.a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);
  1386. var
  1387. so : tshifterop;
  1388. procedure do_shift(shiftmode : tshiftmode; shiftimm : byte; reg : tregister);
  1389. begin
  1390. if GenerateThumbCode then
  1391. begin
  1392. case shiftmode of
  1393. SM_ASR:
  1394. a_op_const_reg_reg(list,OP_SAR,OS_32,shiftimm,reg,reg2);
  1395. SM_LSR:
  1396. a_op_const_reg_reg(list,OP_SHR,OS_32,shiftimm,reg,reg2);
  1397. SM_LSL:
  1398. a_op_const_reg_reg(list,OP_SHL,OS_32,shiftimm,reg,reg2);
  1399. else
  1400. internalerror(2013090301);
  1401. end;
  1402. end
  1403. else
  1404. begin
  1405. so.shiftmode:=shiftmode;
  1406. so.shiftimm:=shiftimm;
  1407. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,reg2,reg,so));
  1408. end;
  1409. end;
  1410. var
  1411. instr: taicpu;
  1412. conv_done: boolean;
  1413. begin
  1414. if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then
  1415. internalerror(2002090901);
  1416. conv_done:=false;
  1417. if tosize<>fromsize then
  1418. begin
  1419. shifterop_reset(so);
  1420. conv_done:=true;
  1421. if tcgsize2size[tosize]<=tcgsize2size[fromsize] then
  1422. fromsize:=tosize;
  1423. if current_settings.cputype<cpu_armv6 then
  1424. case fromsize of
  1425. OS_8:
  1426. if GenerateThumbCode then
  1427. a_op_const_reg_reg(list,OP_AND,OS_32,$ff,reg1,reg2)
  1428. else
  1429. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1430. OS_S8:
  1431. begin
  1432. do_shift(SM_LSL,24,reg1);
  1433. if tosize=OS_16 then
  1434. begin
  1435. do_shift(SM_ASR,8,reg2);
  1436. do_shift(SM_LSR,16,reg2);
  1437. end
  1438. else
  1439. do_shift(SM_ASR,24,reg2);
  1440. end;
  1441. OS_16:
  1442. begin
  1443. do_shift(SM_LSL,16,reg1);
  1444. do_shift(SM_LSR,16,reg2);
  1445. end;
  1446. OS_S16:
  1447. begin
  1448. do_shift(SM_LSL,16,reg1);
  1449. do_shift(SM_ASR,16,reg2)
  1450. end;
  1451. else
  1452. conv_done:=false;
  1453. end
  1454. else
  1455. case fromsize of
  1456. OS_8:
  1457. if GenerateThumbCode then
  1458. list.concat(taicpu.op_reg_reg(A_UXTB,reg2,reg1))
  1459. else
  1460. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1461. OS_S8:
  1462. begin
  1463. if tosize=OS_16 then
  1464. begin
  1465. so.shiftmode:=SM_ROR;
  1466. so.shiftimm:=16;
  1467. list.concat(taicpu.op_reg_reg_shifterop(A_SXTB16,reg2,reg1,so));
  1468. do_shift(SM_LSR,16,reg2);
  1469. end
  1470. else
  1471. list.concat(taicpu.op_reg_reg(A_SXTB,reg2,reg1));
  1472. end;
  1473. OS_16:
  1474. list.concat(taicpu.op_reg_reg(A_UXTH,reg2,reg1));
  1475. OS_S16:
  1476. list.concat(taicpu.op_reg_reg(A_SXTH,reg2,reg1));
  1477. else
  1478. conv_done:=false;
  1479. end
  1480. end;
  1481. if not conv_done and (reg1<>reg2) then
  1482. begin
  1483. { same size, only a register mov required }
  1484. instr:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
  1485. list.Concat(instr);
  1486. { Notify the register allocator that we have written a move instruction so
  1487. it can try to eliminate it. }
  1488. add_move_instruction(instr);
  1489. end;
  1490. end;
  1491. procedure tbasecgarm.a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);
  1492. var
  1493. href,href2 : treference;
  1494. hloc : pcgparalocation;
  1495. begin
  1496. href:=ref;
  1497. hloc:=paraloc.location;
  1498. while assigned(hloc) do
  1499. begin
  1500. case hloc^.loc of
  1501. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  1502. begin
  1503. paramanager.allocparaloc(list,paraloc.location);
  1504. a_loadfpu_ref_reg(list,size,size,ref,hloc^.register);
  1505. end;
  1506. LOC_REGISTER :
  1507. case hloc^.size of
  1508. OS_32,
  1509. OS_F32:
  1510. begin
  1511. paramanager.allocparaloc(list,paraloc.location);
  1512. a_load_ref_reg(list,OS_32,OS_32,href,hloc^.register);
  1513. end;
  1514. OS_64,
  1515. OS_F64:
  1516. cg64.a_load64_ref_cgpara(list,href,paraloc);
  1517. else
  1518. a_load_ref_reg(list,hloc^.size,hloc^.size,href,hloc^.register);
  1519. end;
  1520. LOC_REFERENCE :
  1521. begin
  1522. reference_reset_base(href2,hloc^.reference.index,hloc^.reference.offset,paraloc.alignment,[]);
  1523. { concatcopy should choose the best way to copy the data }
  1524. g_concatcopy(list,href,href2,tcgsize2size[hloc^.size]);
  1525. end;
  1526. else
  1527. internalerror(200408241);
  1528. end;
  1529. inc(href.offset,tcgsize2size[hloc^.size]);
  1530. hloc:=hloc^.next;
  1531. end;
  1532. end;
  1533. procedure tbasecgarm.a_loadfpu_reg_reg(list: TAsmList; fromsize,tosize: tcgsize; reg1, reg2: tregister);
  1534. begin
  1535. list.concat(setoppostfix(taicpu.op_reg_reg(A_MVF,reg2,reg1),cgsize2fpuoppostfix[tosize]));
  1536. end;
  1537. procedure tbasecgarm.a_loadfpu_ref_reg(list: TAsmList; fromsize,tosize: tcgsize; const ref: treference; reg: tregister);
  1538. var
  1539. oppostfix:toppostfix;
  1540. begin
  1541. case fromsize of
  1542. OS_32,
  1543. OS_F32:
  1544. oppostfix:=PF_S;
  1545. OS_64,
  1546. OS_F64:
  1547. oppostfix:=PF_D;
  1548. OS_F80:
  1549. oppostfix:=PF_E;
  1550. else
  1551. InternalError(200309021);
  1552. end;
  1553. handle_load_store(list,A_LDF,oppostfix,reg,ref);
  1554. if fromsize<>tosize then
  1555. a_loadfpu_reg_reg(list,fromsize,tosize,reg,reg);
  1556. end;
  1557. procedure tbasecgarm.a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);
  1558. var
  1559. oppostfix:toppostfix;
  1560. begin
  1561. case tosize of
  1562. OS_F32:
  1563. oppostfix:=PF_S;
  1564. OS_F64:
  1565. oppostfix:=PF_D;
  1566. OS_F80:
  1567. oppostfix:=PF_E;
  1568. else
  1569. InternalError(200309022);
  1570. end;
  1571. handle_load_store(list,A_STF,oppostfix,reg,ref);
  1572. end;
  1573. { comparison operations }
  1574. procedure tbasecgarm.a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  1575. l : tasmlabel);
  1576. var
  1577. tmpreg : tregister;
  1578. b : byte;
  1579. begin
  1580. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1581. if (not(GenerateThumbCode) and is_shifter_const(a,b)) or
  1582. ((GenerateThumbCode) and is_thumb_imm(a)) then
  1583. list.concat(taicpu.op_reg_const(A_CMP,reg,a))
  1584. { CMN reg,0 and CMN reg,$80000000 are different from CMP reg,$ffffffff
  1585. and CMP reg,$7fffffff regarding the flags according to the ARM manual }
  1586. else if (a<>$7fffffff) and (a<>-1) and not(GenerateThumbCode) and is_shifter_const(-a,b) then
  1587. list.concat(taicpu.op_reg_const(A_CMN,reg,-a))
  1588. else
  1589. begin
  1590. tmpreg:=getintregister(list,size);
  1591. a_load_const_reg(list,size,a,tmpreg);
  1592. list.concat(taicpu.op_reg_reg(A_CMP,reg,tmpreg));
  1593. end;
  1594. a_jmp_cond(list,cmp_op,l);
  1595. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1596. end;
  1597. procedure tbasecgarm.a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister);
  1598. begin
  1599. if reverse then
  1600. begin
  1601. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,src));
  1602. list.Concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,31));
  1603. list.Concat(taicpu.op_reg_reg_const(A_AND,dst,dst,255));
  1604. end
  1605. { it is decided during the compilation of the system unit if this code is used or not
  1606. so no additional check for rbit is needed }
  1607. else
  1608. begin
  1609. list.Concat(taicpu.op_reg_reg(A_RBIT,dst,src));
  1610. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,dst));
  1611. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1612. list.Concat(taicpu.op_reg_const(A_CMP,dst,32));
  1613. if GenerateThumb2Code then
  1614. list.Concat(taicpu.op_cond(A_IT, C_EQ));
  1615. list.Concat(setcondition(taicpu.op_reg_const(A_MOV,dst,$ff),C_EQ));
  1616. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1617. end;
  1618. end;
  1619. procedure tbasecgarm.a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel);
  1620. begin
  1621. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1622. list.concat(taicpu.op_reg_reg(A_CMP,reg2,reg1));
  1623. a_jmp_cond(list,cmp_op,l);
  1624. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1625. end;
  1626. procedure tbasecgarm.a_jmp_name(list : TAsmList;const s : string);
  1627. var
  1628. ai : taicpu;
  1629. begin
  1630. { generate far jump, leave it to the optimizer to get rid of it }
  1631. if GenerateThumbCode then
  1632. ai:=taicpu.op_sym(A_BL,current_asmdata.RefAsmSymbol(s,AT_FUNCTION))
  1633. else
  1634. ai:=taicpu.op_sym(A_B,current_asmdata.RefAsmSymbol(s,AT_FUNCTION));
  1635. ai.is_jmp:=true;
  1636. list.concat(ai);
  1637. end;
  1638. procedure tbasecgarm.a_jmp_always(list : TAsmList;l: tasmlabel);
  1639. var
  1640. ai : taicpu;
  1641. begin
  1642. { generate far jump, leave it to the optimizer to get rid of it }
  1643. if GenerateThumbCode then
  1644. ai:=taicpu.op_sym(A_BL,l)
  1645. else
  1646. ai:=taicpu.op_sym(A_B,l);
  1647. ai.is_jmp:=true;
  1648. list.concat(ai);
  1649. end;
  1650. procedure tbasecgarm.a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel);
  1651. var
  1652. ai : taicpu;
  1653. inv_flags : TResFlags;
  1654. hlabel : TAsmLabel;
  1655. begin
  1656. if GenerateThumbCode then
  1657. begin
  1658. inv_flags:=f;
  1659. inverse_flags(inv_flags);
  1660. { the optimizer has to fix this if jump range is sufficient short }
  1661. current_asmdata.getjumplabel(hlabel);
  1662. ai:=setcondition(taicpu.op_sym(A_B,hlabel),flags_to_cond(inv_flags));
  1663. ai.is_jmp:=true;
  1664. list.concat(ai);
  1665. a_jmp_always(list,l);
  1666. a_label(list,hlabel);
  1667. end
  1668. else
  1669. begin
  1670. ai:=setcondition(taicpu.op_sym(A_B,l),flags_to_cond(f));
  1671. ai.is_jmp:=true;
  1672. list.concat(ai);
  1673. end;
  1674. end;
  1675. procedure tbasecgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  1676. begin
  1677. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  1678. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  1679. end;
  1680. procedure tbasecgarm.g_profilecode(list : TAsmList);
  1681. begin
  1682. if target_info.system = system_arm_linux then
  1683. begin
  1684. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R14]));
  1685. a_call_name(list,'__gnu_mcount_nc',false);
  1686. end
  1687. else
  1688. internalerror(2014091201);
  1689. end;
  1690. procedure tbasecgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  1691. var
  1692. ref : treference;
  1693. shift : byte;
  1694. firstfloatreg,lastfloatreg,
  1695. r : byte;
  1696. mmregs,
  1697. regs, saveregs : tcpuregisterset;
  1698. registerarea,
  1699. r7offset,
  1700. stackmisalignment : pint;
  1701. imm1, imm2: DWord;
  1702. stack_parameters : Boolean;
  1703. begin
  1704. LocalSize:=align(LocalSize,4);
  1705. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  1706. { call instruction does not put anything on the stack }
  1707. registerarea:=0;
  1708. tcpuprocinfo(current_procinfo).stackpaddingreg:=High(TSuperRegister);
  1709. lastfloatreg:=RS_NO;
  1710. if not(nostackframe) then
  1711. begin
  1712. firstfloatreg:=RS_NO;
  1713. mmregs:=[];
  1714. case current_settings.fputype of
  1715. fpu_fpa,
  1716. fpu_fpa10,
  1717. fpu_fpa11:
  1718. begin
  1719. { save floating point registers? }
  1720. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1721. for r:=RS_F0 to RS_F7 do
  1722. if r in regs then
  1723. begin
  1724. if firstfloatreg=RS_NO then
  1725. firstfloatreg:=r;
  1726. lastfloatreg:=r;
  1727. inc(registerarea,12);
  1728. end;
  1729. end;
  1730. fpu_vfpv2,
  1731. fpu_vfpv3,
  1732. fpu_vfpv4,
  1733. fpu_vfpv3_d16:
  1734. begin;
  1735. { the *[0..31] is a hack to prevent that the compiler tries to save odd single-type registers,
  1736. they have numbers>$1f which is not really correct as they should simply have the same numbers
  1737. as the even ones by with a different subtype as it is done on x86 with al/ah }
  1738. mmregs:=(rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall))*[0..31];
  1739. end;
  1740. end;
  1741. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1742. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1743. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  1744. { save int registers }
  1745. reference_reset(ref,4,[]);
  1746. ref.index:=NR_STACK_POINTER_REG;
  1747. ref.addressmode:=AM_PREINDEXED;
  1748. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  1749. if not(target_info.system in systems_darwin) then
  1750. begin
  1751. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1752. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1753. begin
  1754. a_reg_alloc(list,NR_R12);
  1755. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  1756. end;
  1757. { the (old) ARM APCS requires saving both the stack pointer (to
  1758. crawl the stack) and the PC (to identify the function this
  1759. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  1760. and R15 -- still needs updating for EABI and Darwin, they don't
  1761. need that }
  1762. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1763. regs:=regs+[RS_FRAME_POINTER_REG,RS_R12,RS_R14,RS_R15]
  1764. else
  1765. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1766. include(regs,RS_R14);
  1767. if regs<>[] then
  1768. begin
  1769. for r:=RS_R0 to RS_R15 do
  1770. if r in regs then
  1771. inc(registerarea,4);
  1772. { if the stack is not 8 byte aligned, try to add an extra register,
  1773. so we can avoid the extra sub/add ...,#4 later (KB) }
  1774. if ((registerarea mod current_settings.alignment.localalignmax) <> 0) then
  1775. for r:=RS_R3 downto RS_R0 do
  1776. if not(r in regs) then
  1777. begin
  1778. regs:=regs+[r];
  1779. inc(registerarea,4);
  1780. tcpuprocinfo(current_procinfo).stackpaddingreg:=r;
  1781. break;
  1782. end;
  1783. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  1784. end;
  1785. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1786. begin
  1787. { the framepointer now points to the saved R15, so the saved
  1788. framepointer is at R11-12 (for get_caller_frame) }
  1789. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  1790. a_reg_dealloc(list,NR_R12);
  1791. end;
  1792. end
  1793. else
  1794. begin
  1795. { always save r14 if we use r7 as the framepointer, because
  1796. the parameter offsets are hardcoded in advance and always
  1797. assume that r14 sits on the stack right behind the saved r7
  1798. }
  1799. if current_procinfo.framepointer=NR_FRAME_POINTER_REG then
  1800. include(regs,RS_FRAME_POINTER_REG);
  1801. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1802. include(regs,RS_R14);
  1803. if regs<>[] then
  1804. begin
  1805. { on Darwin, you first have to save [r4-r7,lr], and then
  1806. [r8,r10,r11] and make r7 point to the previously saved
  1807. r7 so that you can perform a stack crawl based on it
  1808. ([r7] is previous stack frame, [r7+4] is return address
  1809. }
  1810. include(regs,RS_FRAME_POINTER_REG);
  1811. saveregs:=regs-[RS_R8,RS_R10,RS_R11];
  1812. r7offset:=0;
  1813. for r:=RS_R0 to RS_R15 do
  1814. if r in saveregs then
  1815. begin
  1816. inc(registerarea,4);
  1817. if r<RS_FRAME_POINTER_REG then
  1818. inc(r7offset,4);
  1819. end;
  1820. { save the registers }
  1821. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1822. { make r7 point to the saved r7 (regardless of whether this
  1823. frame uses the framepointer, for backtrace purposes) }
  1824. if r7offset<>0 then
  1825. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_FRAME_POINTER_REG,NR_R13,r7offset))
  1826. else
  1827. list.concat(taicpu.op_reg_reg(A_MOV,NR_R7,NR_R13));
  1828. { now save the rest (if any) }
  1829. saveregs:=regs-saveregs;
  1830. if saveregs<>[] then
  1831. begin
  1832. for r:=RS_R8 to RS_R11 do
  1833. if r in saveregs then
  1834. inc(registerarea,4);
  1835. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1836. end;
  1837. end;
  1838. end;
  1839. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  1840. if (LocalSize<>0) or
  1841. ((stackmisalignment<>0) and
  1842. ((pi_do_call in current_procinfo.flags) or
  1843. (po_assembler in current_procinfo.procdef.procoptions))) then
  1844. begin
  1845. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  1846. if stack_parameters and (pi_estimatestacksize in current_procinfo.flags) then
  1847. begin
  1848. if localsize>tcpuprocinfo(current_procinfo).stackframesize then
  1849. internalerror(2014030901)
  1850. else
  1851. localsize:=tcpuprocinfo(current_procinfo).stackframesize-registerarea;
  1852. end;
  1853. if is_shifter_const(localsize,shift) then
  1854. begin
  1855. a_reg_dealloc(list,NR_R12);
  1856. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  1857. end
  1858. else if split_into_shifter_const(localsize, imm1, imm2) then
  1859. begin
  1860. a_reg_dealloc(list,NR_R12);
  1861. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  1862. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  1863. end
  1864. else
  1865. begin
  1866. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  1867. a_reg_alloc(list,NR_R12);
  1868. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  1869. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  1870. a_reg_dealloc(list,NR_R12);
  1871. end;
  1872. end;
  1873. if (mmregs<>[]) or
  1874. (firstfloatreg<>RS_NO) then
  1875. begin
  1876. reference_reset(ref,4,[]);
  1877. if (tg.direction*tcpuprocinfo(current_procinfo).floatregstart>=1023) or
  1878. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv4,fpu_vfpv3_d16]) then
  1879. begin
  1880. if not is_shifter_const(tcpuprocinfo(current_procinfo).floatregstart,shift) then
  1881. begin
  1882. a_reg_alloc(list,NR_R12);
  1883. a_load_const_reg(list,OS_ADDR,-tcpuprocinfo(current_procinfo).floatregstart,NR_R12);
  1884. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1885. a_reg_dealloc(list,NR_R12);
  1886. end
  1887. else
  1888. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tcpuprocinfo(current_procinfo).floatregstart));
  1889. ref.base:=NR_R12;
  1890. end
  1891. else
  1892. begin
  1893. ref.base:=current_procinfo.framepointer;
  1894. ref.offset:=tcpuprocinfo(current_procinfo).floatregstart;
  1895. end;
  1896. case current_settings.fputype of
  1897. fpu_fpa,
  1898. fpu_fpa10,
  1899. fpu_fpa11:
  1900. begin
  1901. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  1902. lastfloatreg-firstfloatreg+1,ref));
  1903. end;
  1904. fpu_vfpv2,
  1905. fpu_vfpv3,
  1906. fpu_vfpv4,
  1907. fpu_vfpv3_d16:
  1908. begin
  1909. ref.index:=ref.base;
  1910. ref.base:=NR_NO;
  1911. { FSTMX is deprecated on ARMv6 and later }
  1912. {if (current_settings.cputype<cpu_armv6) then
  1913. postfix:=PF_IAX
  1914. else
  1915. postfix:=PF_IAD;}
  1916. if mmregs<>[] then
  1917. list.concat(taicpu.op_ref_regset(A_VSTM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  1918. end;
  1919. end;
  1920. end;
  1921. end;
  1922. end;
  1923. procedure tbasecgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  1924. var
  1925. ref : treference;
  1926. LocalSize : longint;
  1927. firstfloatreg,lastfloatreg,
  1928. r,
  1929. shift : byte;
  1930. mmregs,
  1931. saveregs,
  1932. regs : tcpuregisterset;
  1933. registerarea,
  1934. stackmisalignment: pint;
  1935. paddingreg: TSuperRegister;
  1936. imm1, imm2: DWord;
  1937. begin
  1938. if not(nostackframe) then
  1939. begin
  1940. registerarea:=0;
  1941. firstfloatreg:=RS_NO;
  1942. lastfloatreg:=RS_NO;
  1943. mmregs:=[];
  1944. saveregs:=[];
  1945. case current_settings.fputype of
  1946. fpu_fpa,
  1947. fpu_fpa10,
  1948. fpu_fpa11:
  1949. begin
  1950. { restore floating point registers? }
  1951. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1952. for r:=RS_F0 to RS_F7 do
  1953. if r in regs then
  1954. begin
  1955. if firstfloatreg=RS_NO then
  1956. firstfloatreg:=r;
  1957. lastfloatreg:=r;
  1958. { floating point register space is already included in
  1959. localsize below by calc_stackframe_size
  1960. inc(registerarea,12);
  1961. }
  1962. end;
  1963. end;
  1964. fpu_vfpv2,
  1965. fpu_vfpv3,
  1966. fpu_vfpv4,
  1967. fpu_vfpv3_d16:
  1968. begin;
  1969. { restore vfp registers? }
  1970. { the *[0..31] is a hack to prevent that the compiler tries to save odd single-type registers,
  1971. they have numbers>$1f which is not really correct as they should simply have the same numbers
  1972. as the even ones by with a different subtype as it is done on x86 with al/ah }
  1973. mmregs:=(rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall))*[0..31];
  1974. end;
  1975. end;
  1976. if (firstfloatreg<>RS_NO) or
  1977. (mmregs<>[]) then
  1978. begin
  1979. reference_reset(ref,4,[]);
  1980. if (tg.direction*tcpuprocinfo(current_procinfo).floatregstart>=1023) or
  1981. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv4,fpu_vfpv3_d16]) then
  1982. begin
  1983. if not is_shifter_const(tcpuprocinfo(current_procinfo).floatregstart,shift) then
  1984. begin
  1985. a_reg_alloc(list,NR_R12);
  1986. a_load_const_reg(list,OS_ADDR,-tcpuprocinfo(current_procinfo).floatregstart,NR_R12);
  1987. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1988. a_reg_dealloc(list,NR_R12);
  1989. end
  1990. else
  1991. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tcpuprocinfo(current_procinfo).floatregstart));
  1992. ref.base:=NR_R12;
  1993. end
  1994. else
  1995. begin
  1996. ref.base:=current_procinfo.framepointer;
  1997. ref.offset:=tcpuprocinfo(current_procinfo).floatregstart;
  1998. end;
  1999. case current_settings.fputype of
  2000. fpu_fpa,
  2001. fpu_fpa10,
  2002. fpu_fpa11:
  2003. begin
  2004. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  2005. lastfloatreg-firstfloatreg+1,ref));
  2006. end;
  2007. fpu_vfpv2,
  2008. fpu_vfpv3,
  2009. fpu_vfpv4,
  2010. fpu_vfpv3_d16:
  2011. begin
  2012. ref.index:=ref.base;
  2013. ref.base:=NR_NO;
  2014. { FLDMX is deprecated on ARMv6 and later }
  2015. {if (current_settings.cputype<cpu_armv6) then
  2016. mmpostfix:=PF_IAX
  2017. else
  2018. mmpostfix:=PF_IAD;}
  2019. if mmregs<>[] then
  2020. list.concat(taicpu.op_ref_regset(A_VLDM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  2021. end;
  2022. end;
  2023. end;
  2024. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  2025. if (pi_do_call in current_procinfo.flags) or
  2026. (regs<>[]) or
  2027. ((target_info.system in systems_darwin) and
  2028. (current_procinfo.framepointer<>NR_STACK_POINTER_REG)) then
  2029. begin
  2030. exclude(regs,RS_R14);
  2031. include(regs,RS_R15);
  2032. if (target_info.system in systems_darwin) then
  2033. include(regs,RS_FRAME_POINTER_REG);
  2034. end;
  2035. if not(target_info.system in systems_darwin) then
  2036. begin
  2037. { restore saved stack pointer to SP (R13) and saved lr to PC (R15).
  2038. The saved PC came after that but is discarded, since we restore
  2039. the stack pointer }
  2040. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  2041. regs:=regs+[RS_FRAME_POINTER_REG,RS_R13,RS_R15];
  2042. end
  2043. else
  2044. begin
  2045. { restore R8-R11 already if necessary (they've been stored
  2046. before the others) }
  2047. saveregs:=regs*[RS_R8,RS_R10,RS_R11];
  2048. if saveregs<>[] then
  2049. begin
  2050. reference_reset(ref,4,[]);
  2051. ref.index:=NR_STACK_POINTER_REG;
  2052. ref.addressmode:=AM_PREINDEXED;
  2053. for r:=RS_R8 to RS_R11 do
  2054. if r in saveregs then
  2055. inc(registerarea,4);
  2056. regs:=regs-saveregs;
  2057. end;
  2058. end;
  2059. for r:=RS_R0 to RS_R15 do
  2060. if r in regs then
  2061. inc(registerarea,4);
  2062. { reapply the stack padding reg, in case there was one, see the complimentary
  2063. comment in g_proc_entry() (KB) }
  2064. paddingreg:=tcpuprocinfo(current_procinfo).stackpaddingreg;
  2065. if paddingreg < RS_R4 then
  2066. if paddingreg in regs then
  2067. internalerror(201306190)
  2068. else
  2069. begin
  2070. regs:=regs+[paddingreg];
  2071. inc(registerarea,4);
  2072. end;
  2073. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  2074. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  2075. (target_info.system in systems_darwin) then
  2076. begin
  2077. LocalSize:=current_procinfo.calc_stackframe_size;
  2078. if (LocalSize<>0) or
  2079. ((stackmisalignment<>0) and
  2080. ((pi_do_call in current_procinfo.flags) or
  2081. (po_assembler in current_procinfo.procdef.procoptions))) then
  2082. begin
  2083. if pi_estimatestacksize in current_procinfo.flags then
  2084. LocalSize:=tcpuprocinfo(current_procinfo).stackframesize-registerarea
  2085. else
  2086. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  2087. if is_shifter_const(LocalSize,shift) then
  2088. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  2089. else if split_into_shifter_const(localsize, imm1, imm2) then
  2090. begin
  2091. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  2092. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  2093. end
  2094. else
  2095. begin
  2096. a_reg_alloc(list,NR_R12);
  2097. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  2098. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  2099. a_reg_dealloc(list,NR_R12);
  2100. end;
  2101. end;
  2102. if (target_info.system in systems_darwin) and
  2103. (saveregs<>[]) then
  2104. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  2105. if regs=[] then
  2106. begin
  2107. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2108. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2109. else
  2110. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2111. end
  2112. else
  2113. begin
  2114. reference_reset(ref,4,[]);
  2115. ref.index:=NR_STACK_POINTER_REG;
  2116. ref.addressmode:=AM_PREINDEXED;
  2117. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  2118. end;
  2119. end
  2120. else
  2121. begin
  2122. { restore int registers and return }
  2123. reference_reset(ref,4,[]);
  2124. ref.index:=NR_FRAME_POINTER_REG;
  2125. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_EA));
  2126. end;
  2127. end
  2128. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2129. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2130. else
  2131. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2132. end;
  2133. procedure tbasecgarm.g_maybe_got_init(list : TAsmList);
  2134. var
  2135. ref : treference;
  2136. l : TAsmLabel;
  2137. regs : tcpuregisterset;
  2138. r: byte;
  2139. begin
  2140. if (cs_create_pic in current_settings.moduleswitches) and
  2141. (pi_needs_got in current_procinfo.flags) and
  2142. (tf_pic_uses_got in target_info.flags) then
  2143. begin
  2144. { Procedure parametrs are not initialized at this stage.
  2145. Before GOT initialization code, allocate registers used for procedure parameters
  2146. to prevent usage of these registers for temp operations in later stages of code
  2147. generation. }
  2148. regs:=rg[R_INTREGISTER].used_in_proc;
  2149. for r:=RS_R0 to RS_R3 do
  2150. if r in regs then
  2151. a_reg_alloc(list, newreg(R_INTREGISTER,r,R_SUBWHOLE));
  2152. { Allocate scratch register R12 and use it for GOT calculations directly.
  2153. Otherwise the init code can be distorted in later stages of code generation. }
  2154. a_reg_alloc(list,NR_R12);
  2155. reference_reset(ref,4,[]);
  2156. current_asmdata.getglobaldatalabel(l);
  2157. cg.a_label(current_procinfo.aktlocaldata,l);
  2158. ref.symbol:=l;
  2159. ref.base:=NR_PC;
  2160. ref.symboldata:=current_procinfo.aktlocaldata.last;
  2161. list.concat(Taicpu.op_reg_ref(A_LDR,NR_R12,ref));
  2162. current_asmdata.getaddrlabel(l);
  2163. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_32bit,l,current_asmdata.RefAsmSymbol('_GLOBAL_OFFSET_TABLE_',AT_DATA),-8));
  2164. cg.a_label(list,l);
  2165. list.concat(Taicpu.op_reg_reg_reg(A_ADD,NR_R12,NR_PC,NR_R12));
  2166. list.concat(Taicpu.op_reg_reg(A_MOV,current_procinfo.got,NR_R12));
  2167. { Deallocate registers }
  2168. a_reg_dealloc(list,NR_R12);
  2169. for r:=RS_R3 downto RS_R0 do
  2170. if r in regs then
  2171. a_reg_dealloc(list, newreg(R_INTREGISTER,r,R_SUBWHOLE));
  2172. end;
  2173. end;
  2174. procedure tbasecgarm.a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);
  2175. var
  2176. b : byte;
  2177. tmpref : treference;
  2178. instr : taicpu;
  2179. begin
  2180. if ref.addressmode<>AM_OFFSET then
  2181. internalerror(200309071);
  2182. tmpref:=ref;
  2183. { Be sure to have a base register }
  2184. if (tmpref.base=NR_NO) then
  2185. begin
  2186. if tmpref.shiftmode<>SM_None then
  2187. internalerror(2014020702);
  2188. if tmpref.signindex<0 then
  2189. internalerror(200312023);
  2190. tmpref.base:=tmpref.index;
  2191. tmpref.index:=NR_NO;
  2192. end;
  2193. if assigned(tmpref.symbol) or
  2194. not((is_shifter_const(tmpref.offset,b)) or
  2195. (is_shifter_const(-tmpref.offset,b))
  2196. ) then
  2197. fixref(list,tmpref);
  2198. { expect a base here if there is an index }
  2199. if (tmpref.base=NR_NO) and (tmpref.index<>NR_NO) then
  2200. internalerror(200312022);
  2201. if tmpref.index<>NR_NO then
  2202. begin
  2203. if tmpref.shiftmode<>SM_None then
  2204. internalerror(200312021);
  2205. if tmpref.signindex<0 then
  2206. a_op_reg_reg_reg(list,OP_SUB,OS_ADDR,tmpref.base,tmpref.index,r)
  2207. else
  2208. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpref.base,tmpref.index,r);
  2209. if tmpref.offset<>0 then
  2210. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,r,r);
  2211. end
  2212. else
  2213. begin
  2214. if tmpref.base=NR_NO then
  2215. a_load_const_reg(list,OS_ADDR,tmpref.offset,r)
  2216. else
  2217. if tmpref.offset<>0 then
  2218. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,tmpref.base,r)
  2219. else
  2220. begin
  2221. instr:=taicpu.op_reg_reg(A_MOV,r,tmpref.base);
  2222. list.concat(instr);
  2223. add_move_instruction(instr);
  2224. end;
  2225. end;
  2226. end;
  2227. procedure tbasecgarm.fixref(list : TAsmList;var ref : treference);
  2228. var
  2229. tmpreg, tmpreg2 : tregister;
  2230. tmpref : treference;
  2231. l, piclabel : tasmlabel;
  2232. indirection_done : boolean;
  2233. begin
  2234. { absolute symbols can't be handled directly, we've to store the symbol reference
  2235. in the text segment and access it pc relative
  2236. For now, we assume that references where base or index equals to PC are already
  2237. relative, all other references are assumed to be absolute and thus they need
  2238. to be handled extra.
  2239. A proper solution would be to change refoptions to a set and store the information
  2240. if the symbol is absolute or relative there.
  2241. }
  2242. { create consts entry }
  2243. reference_reset(tmpref,4,[]);
  2244. current_asmdata.getjumplabel(l);
  2245. cg.a_label(current_procinfo.aktlocaldata,l);
  2246. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  2247. piclabel:=nil;
  2248. tmpreg:=NR_NO;
  2249. indirection_done:=false;
  2250. if assigned(ref.symbol) then
  2251. begin
  2252. if (target_info.system=system_arm_darwin) and
  2253. (ref.symbol.bind in [AB_EXTERNAL,AB_WEAK_EXTERNAL,AB_PRIVATE_EXTERN,AB_COMMON]) then
  2254. begin
  2255. tmpreg:=g_indirect_sym_load(list,ref.symbol.name,asmsym2indsymflags(ref.symbol));
  2256. if ref.offset<>0 then
  2257. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2258. indirection_done:=true;
  2259. end
  2260. else if (cs_create_pic in current_settings.moduleswitches) then
  2261. if (tf_pic_uses_got in target_info.flags) then
  2262. current_procinfo.aktlocaldata.concat(tai_const.Create_type_sym(aitconst_got,ref.symbol))
  2263. else
  2264. begin
  2265. { ideally, we would want to generate
  2266. ldr r1, LPICConstPool
  2267. LPICLocal:
  2268. ldr/str r2,[pc,r1]
  2269. ...
  2270. LPICConstPool:
  2271. .long _globsym-(LPICLocal+8)
  2272. However, we cannot be sure that the ldr/str will follow
  2273. right after the call to fixref, so we have to load the
  2274. complete address already in a register.
  2275. }
  2276. current_asmdata.getaddrlabel(piclabel);
  2277. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_ptr,piclabel,ref.symbol,ref.offset-8));
  2278. end
  2279. else
  2280. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset))
  2281. end
  2282. else
  2283. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ref.offset));
  2284. { load consts entry }
  2285. if not indirection_done then
  2286. begin
  2287. tmpreg:=getintregister(list,OS_INT);
  2288. tmpref.symbol:=l;
  2289. tmpref.base:=NR_PC;
  2290. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2291. if (cs_create_pic in current_settings.moduleswitches) and
  2292. (tf_pic_uses_got in target_info.flags) and
  2293. assigned(ref.symbol) then
  2294. begin
  2295. reference_reset(tmpref,4,[]);
  2296. tmpref.base:=current_procinfo.got;
  2297. tmpref.index:=tmpreg;
  2298. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2299. if ref.offset<>0 then
  2300. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2301. end;
  2302. end;
  2303. if assigned(piclabel) then
  2304. begin
  2305. cg.a_label(list,piclabel);
  2306. tmpreg2:=getaddressregister(list);
  2307. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpreg,NR_PC,tmpreg2);
  2308. tmpreg:=tmpreg2
  2309. end;
  2310. { This routine can be called with PC as base/index in case the offset
  2311. was too large to encode in a load/store. In that case, the entire
  2312. absolute expression has been re-encoded in a new constpool entry, and
  2313. we have to remove the use of PC from the original reference (the code
  2314. above made everything relative to the value loaded from the new
  2315. constpool entry) }
  2316. if is_pc(ref.base) then
  2317. ref.base:=NR_NO;
  2318. if is_pc(ref.index) then
  2319. ref.index:=NR_NO;
  2320. if (ref.base<>NR_NO) then
  2321. begin
  2322. if ref.index<>NR_NO then
  2323. begin
  2324. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  2325. ref.base:=tmpreg;
  2326. end
  2327. else
  2328. if ref.base<>NR_PC then
  2329. begin
  2330. ref.index:=tmpreg;
  2331. ref.shiftimm:=0;
  2332. ref.signindex:=1;
  2333. ref.shiftmode:=SM_None;
  2334. end
  2335. else
  2336. ref.base:=tmpreg;
  2337. end
  2338. else
  2339. ref.base:=tmpreg;
  2340. ref.offset:=0;
  2341. ref.symbol:=nil;
  2342. end;
  2343. procedure tbasecgarm.g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  2344. var
  2345. paraloc1,paraloc2,paraloc3 : TCGPara;
  2346. pd : tprocdef;
  2347. begin
  2348. pd:=search_system_proc('MOVE');
  2349. paraloc1.init;
  2350. paraloc2.init;
  2351. paraloc3.init;
  2352. paramanager.getintparaloc(list,pd,1,paraloc1);
  2353. paramanager.getintparaloc(list,pd,2,paraloc2);
  2354. paramanager.getintparaloc(list,pd,3,paraloc3);
  2355. a_load_const_cgpara(list,OS_SINT,len,paraloc3);
  2356. a_loadaddr_ref_cgpara(list,dest,paraloc2);
  2357. a_loadaddr_ref_cgpara(list,source,paraloc1);
  2358. paramanager.freecgpara(list,paraloc3);
  2359. paramanager.freecgpara(list,paraloc2);
  2360. paramanager.freecgpara(list,paraloc1);
  2361. alloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2362. alloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2363. a_call_name(list,'FPC_MOVE',false);
  2364. dealloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2365. dealloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2366. paraloc3.done;
  2367. paraloc2.done;
  2368. paraloc1.done;
  2369. end;
  2370. procedure tbasecgarm.g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  2371. const
  2372. maxtmpreg_arm = 10; {roozbeh: can be reduced to 8 or lower if might conflick with reserved ones,also +2 is used becouse of regs required for referencing}
  2373. maxtmpreg_thumb = 5;
  2374. var
  2375. srcref,dstref,usedtmpref,usedtmpref2:treference;
  2376. srcreg,destreg,countreg,r,tmpreg:tregister;
  2377. helpsize:aint;
  2378. copysize:byte;
  2379. cgsize:Tcgsize;
  2380. tmpregisters:array[1..maxtmpreg_arm] of tregister;
  2381. maxtmpreg,
  2382. tmpregi,tmpregi2:byte;
  2383. { will never be called with count<=4 }
  2384. procedure genloop(count : aword;size : byte);
  2385. const
  2386. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2387. var
  2388. l : tasmlabel;
  2389. begin
  2390. current_asmdata.getjumplabel(l);
  2391. if count<size then size:=1;
  2392. a_load_const_reg(list,OS_INT,count div size,countreg);
  2393. cg.a_label(list,l);
  2394. srcref.addressmode:=AM_POSTINDEXED;
  2395. dstref.addressmode:=AM_POSTINDEXED;
  2396. srcref.offset:=size;
  2397. dstref.offset:=size;
  2398. r:=getintregister(list,size2opsize[size]);
  2399. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2400. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2401. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1),PF_S));
  2402. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2403. a_jmp_flags(list,F_NE,l);
  2404. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2405. srcref.offset:=1;
  2406. dstref.offset:=1;
  2407. case count mod size of
  2408. 1:
  2409. begin
  2410. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2411. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2412. end;
  2413. 2:
  2414. if aligned then
  2415. begin
  2416. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2417. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2418. end
  2419. else
  2420. begin
  2421. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2422. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2423. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2424. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2425. end;
  2426. 3:
  2427. if aligned then
  2428. begin
  2429. srcref.offset:=2;
  2430. dstref.offset:=2;
  2431. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2432. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2433. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2434. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2435. end
  2436. else
  2437. begin
  2438. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2439. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2440. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2441. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2442. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2443. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2444. end;
  2445. end;
  2446. { keep the registers alive }
  2447. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2448. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2449. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2450. end;
  2451. { will never be called with count<=4 }
  2452. procedure genloop_thumb(count : aword;size : byte);
  2453. procedure refincofs(const ref : treference;const value : longint = 1);
  2454. begin
  2455. a_op_const_reg(list,OP_ADD,OS_ADDR,value,ref.base);
  2456. end;
  2457. const
  2458. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2459. var
  2460. l : tasmlabel;
  2461. begin
  2462. current_asmdata.getjumplabel(l);
  2463. if count<size then size:=1;
  2464. a_load_const_reg(list,OS_INT,count div size,countreg);
  2465. cg.a_label(list,l);
  2466. r:=getintregister(list,size2opsize[size]);
  2467. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2468. refincofs(srcref);
  2469. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2470. refincofs(dstref);
  2471. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2472. list.concat(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1));
  2473. a_jmp_flags(list,F_NE,l);
  2474. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2475. case count mod size of
  2476. 1:
  2477. begin
  2478. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2479. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2480. end;
  2481. 2:
  2482. if aligned then
  2483. begin
  2484. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2485. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2486. end
  2487. else
  2488. begin
  2489. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2490. refincofs(srcref);
  2491. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2492. refincofs(dstref);
  2493. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2494. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2495. end;
  2496. 3:
  2497. if aligned then
  2498. begin
  2499. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2500. refincofs(srcref,2);
  2501. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2502. refincofs(dstref,2);
  2503. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2504. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2505. end
  2506. else
  2507. begin
  2508. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2509. refincofs(srcref);
  2510. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2511. refincofs(dstref);
  2512. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2513. refincofs(srcref);
  2514. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2515. refincofs(dstref);
  2516. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2517. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2518. end;
  2519. end;
  2520. { keep the registers alive }
  2521. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2522. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2523. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2524. end;
  2525. begin
  2526. if len=0 then
  2527. exit;
  2528. if GenerateThumbCode then
  2529. maxtmpreg:=maxtmpreg_thumb
  2530. else
  2531. maxtmpreg:=maxtmpreg_arm;
  2532. helpsize:=12+maxtmpreg*4;//52 with maxtmpreg=10
  2533. dstref:=dest;
  2534. srcref:=source;
  2535. if cs_opt_size in current_settings.optimizerswitches then
  2536. helpsize:=8;
  2537. if aligned and (len=4) then
  2538. begin
  2539. tmpreg:=getintregister(list,OS_32);
  2540. a_load_ref_reg(list,OS_32,OS_32,source,tmpreg);
  2541. a_load_reg_ref(list,OS_32,OS_32,tmpreg,dest);
  2542. end
  2543. else if aligned and (len=2) then
  2544. begin
  2545. tmpreg:=getintregister(list,OS_16);
  2546. a_load_ref_reg(list,OS_16,OS_16,source,tmpreg);
  2547. a_load_reg_ref(list,OS_16,OS_16,tmpreg,dest);
  2548. end
  2549. else if (len<=helpsize) and aligned then
  2550. begin
  2551. tmpregi:=0;
  2552. srcreg:=getintregister(list,OS_ADDR);
  2553. { explicit pc relative addressing, could be
  2554. e.g. a floating point constant }
  2555. if source.base=NR_PC then
  2556. begin
  2557. { ... then we don't need a loadaddr }
  2558. srcref:=source;
  2559. end
  2560. else
  2561. begin
  2562. a_loadaddr_ref_reg(list,source,srcreg);
  2563. reference_reset_base(srcref,srcreg,0,source.alignment,source.volatility);
  2564. end;
  2565. while (len div 4 <> 0) and (tmpregi<maxtmpreg) do
  2566. begin
  2567. inc(tmpregi);
  2568. tmpregisters[tmpregi]:=getintregister(list,OS_32);
  2569. a_load_ref_reg(list,OS_32,OS_32,srcref,tmpregisters[tmpregi]);
  2570. inc(srcref.offset,4);
  2571. dec(len,4);
  2572. end;
  2573. destreg:=getintregister(list,OS_ADDR);
  2574. a_loadaddr_ref_reg(list,dest,destreg);
  2575. reference_reset_base(dstref,destreg,0,dest.alignment,dest.volatility);
  2576. tmpregi2:=1;
  2577. while (tmpregi2<=tmpregi) do
  2578. begin
  2579. a_load_reg_ref(list,OS_32,OS_32,tmpregisters[tmpregi2],dstref);
  2580. inc(dstref.offset,4);
  2581. inc(tmpregi2);
  2582. end;
  2583. copysize:=4;
  2584. cgsize:=OS_32;
  2585. while len<>0 do
  2586. begin
  2587. if len<2 then
  2588. begin
  2589. copysize:=1;
  2590. cgsize:=OS_8;
  2591. end
  2592. else if len<4 then
  2593. begin
  2594. copysize:=2;
  2595. cgsize:=OS_16;
  2596. end;
  2597. dec(len,copysize);
  2598. r:=getintregister(list,cgsize);
  2599. a_load_ref_reg(list,cgsize,cgsize,srcref,r);
  2600. a_load_reg_ref(list,cgsize,cgsize,r,dstref);
  2601. inc(srcref.offset,copysize);
  2602. inc(dstref.offset,copysize);
  2603. end;{end of while}
  2604. end
  2605. else
  2606. begin
  2607. cgsize:=OS_32;
  2608. if (len<=4) then{len<=4 and not aligned}
  2609. begin
  2610. r:=getintregister(list,cgsize);
  2611. usedtmpref:=a_internal_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2612. if Len=1 then
  2613. a_load_reg_ref(list,OS_8,OS_8,r,dstref)
  2614. else
  2615. begin
  2616. tmpreg:=getintregister(list,cgsize);
  2617. usedtmpref2:=a_internal_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2618. inc(usedtmpref.offset,1);
  2619. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2620. inc(usedtmpref2.offset,1);
  2621. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2622. if len>2 then
  2623. begin
  2624. inc(usedtmpref.offset,1);
  2625. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2626. inc(usedtmpref2.offset,1);
  2627. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2628. if len>3 then
  2629. begin
  2630. inc(usedtmpref.offset,1);
  2631. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2632. inc(usedtmpref2.offset,1);
  2633. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2634. end;
  2635. end;
  2636. end;
  2637. end{end of if len<=4}
  2638. else
  2639. begin{unaligned & 4<len<helpsize **or** aligned/unaligned & len>helpsize}
  2640. destreg:=getintregister(list,OS_ADDR);
  2641. a_loadaddr_ref_reg(list,dest,destreg);
  2642. reference_reset_base(dstref,destreg,0,dest.alignment,dest.volatility);
  2643. srcreg:=getintregister(list,OS_ADDR);
  2644. a_loadaddr_ref_reg(list,source,srcreg);
  2645. reference_reset_base(srcref,srcreg,0,source.alignment,source.volatility);
  2646. countreg:=getintregister(list,OS_32);
  2647. // if cs_opt_size in current_settings.optimizerswitches then
  2648. { roozbeh : it seems loading 1 byte is faster becouse of caching/fetching(?) }
  2649. {if aligned then
  2650. genloop(len,4)
  2651. else}
  2652. if GenerateThumbCode then
  2653. genloop_thumb(len,1)
  2654. else
  2655. genloop(len,1);
  2656. end;
  2657. end;
  2658. end;
  2659. procedure tbasecgarm.g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);
  2660. begin
  2661. g_concatcopy_internal(list,source,dest,len,false);
  2662. end;
  2663. procedure tbasecgarm.g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);
  2664. begin
  2665. if (source.alignment in [1,3]) or
  2666. (dest.alignment in [1,3]) then
  2667. g_concatcopy_internal(list,source,dest,len,false)
  2668. else
  2669. g_concatcopy_internal(list,source,dest,len,true);
  2670. end;
  2671. procedure tbasecgarm.g_overflowCheck(list : TAsmList;const l : tlocation;def : tdef);
  2672. var
  2673. ovloc : tlocation;
  2674. begin
  2675. ovloc.loc:=LOC_VOID;
  2676. g_overflowCheck_loc(list,l,def,ovloc);
  2677. end;
  2678. procedure tbasecgarm.g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);
  2679. var
  2680. hl : tasmlabel;
  2681. ai:TAiCpu;
  2682. hflags : tresflags;
  2683. begin
  2684. if not(cs_check_overflow in current_settings.localswitches) then
  2685. exit;
  2686. current_asmdata.getjumplabel(hl);
  2687. case ovloc.loc of
  2688. LOC_VOID:
  2689. begin
  2690. ai:=taicpu.op_sym(A_B,hl);
  2691. ai.is_jmp:=true;
  2692. if not((def.typ=pointerdef) or
  2693. ((def.typ=orddef) and
  2694. (torddef(def).ordtype in [u64bit,u16bit,u32bit,u8bit,uchar,
  2695. pasbool8,pasbool16,pasbool32,pasbool64]))) then
  2696. ai.SetCondition(C_VC)
  2697. else
  2698. if TAiCpu(List.Last).opcode in [A_RSB,A_RSC,A_SBC,A_SUB] then
  2699. ai.SetCondition(C_CS)
  2700. else
  2701. ai.SetCondition(C_CC);
  2702. list.concat(ai);
  2703. end;
  2704. LOC_FLAGS:
  2705. begin
  2706. hflags:=ovloc.resflags;
  2707. inverse_flags(hflags);
  2708. cg.a_jmp_flags(list,hflags,hl);
  2709. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2710. end;
  2711. else
  2712. internalerror(200409281);
  2713. end;
  2714. a_call_name(list,'FPC_OVERFLOW',false);
  2715. a_label(list,hl);
  2716. end;
  2717. procedure tbasecgarm.g_save_registers(list : TAsmList);
  2718. begin
  2719. { this work is done in g_proc_entry }
  2720. end;
  2721. procedure tbasecgarm.g_restore_registers(list : TAsmList);
  2722. begin
  2723. { this work is done in g_proc_exit }
  2724. end;
  2725. procedure tbasecgarm.a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  2726. var
  2727. ai : taicpu;
  2728. hlabel : TAsmLabel;
  2729. begin
  2730. if GenerateThumbCode then
  2731. begin
  2732. { the optimizer has to fix this if jump range is sufficient short }
  2733. current_asmdata.getjumplabel(hlabel);
  2734. ai:=Taicpu.Op_sym(A_B,hlabel);
  2735. ai.SetCondition(inverse_cond(OpCmp2AsmCond[cond]));
  2736. ai.is_jmp:=true;
  2737. list.concat(ai);
  2738. a_jmp_always(list,l);
  2739. a_label(list,hlabel);
  2740. end
  2741. else
  2742. begin
  2743. ai:=Taicpu.Op_sym(A_B,l);
  2744. ai.SetCondition(OpCmp2AsmCond[cond]);
  2745. ai.is_jmp:=true;
  2746. list.concat(ai);
  2747. end;
  2748. end;
  2749. function get_scalar_mm_op(fromsize,tosize : tcgsize) : tasmop;
  2750. const
  2751. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of tasmop = (
  2752. (A_VMOV,A_VCVT,A_NONE,A_NONE,A_NONE),
  2753. (A_VCVT,A_VMOV,A_NONE,A_NONE,A_NONE),
  2754. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2755. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2756. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE));
  2757. begin
  2758. result:=convertop[fromsize,tosize];
  2759. if result=A_NONE then
  2760. internalerror(200312205);
  2761. end;
  2762. function get_scalar_mm_prefix(fromsize,tosize : tcgsize) : TOpPostfix;
  2763. const
  2764. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of TOpPostfix = (
  2765. (PF_F32, PF_F32F64,PF_None,PF_None,PF_None),
  2766. (PF_F64F32,PF_F64, PF_None,PF_None,PF_None),
  2767. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2768. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2769. (PF_None, PF_None, PF_None,PF_None,PF_None));
  2770. begin
  2771. result:=convertop[fromsize,tosize];
  2772. end;
  2773. procedure tbasecgarm.a_loadmm_reg_reg(list: tasmlist; fromsize,tosize: tcgsize; reg1,reg2: tregister; shuffle: pmmshuffle);
  2774. var
  2775. instr: taicpu;
  2776. begin
  2777. if (shuffle=nil) or shufflescalar(shuffle) then
  2778. instr:=setoppostfix(taicpu.op_reg_reg(get_scalar_mm_op(tosize,fromsize),reg2,reg1),get_scalar_mm_prefix(tosize,fromsize))
  2779. else
  2780. internalerror(2009112407);
  2781. list.concat(instr);
  2782. case instr.opcode of
  2783. A_VMOV:
  2784. add_move_instruction(instr);
  2785. end;
  2786. end;
  2787. procedure tbasecgarm.a_loadmm_ref_reg(list: tasmlist; fromsize,tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  2788. var
  2789. intreg,
  2790. tmpmmreg : tregister;
  2791. reg64 : tregister64;
  2792. begin
  2793. if assigned(shuffle) and
  2794. not(shufflescalar(shuffle)) then
  2795. internalerror(2009112413);
  2796. case fromsize of
  2797. OS_32,OS_S32:
  2798. begin
  2799. fromsize:=OS_F32;
  2800. { since we are loading an integer, no conversion may be required }
  2801. if (fromsize<>tosize) then
  2802. internalerror(2009112801);
  2803. end;
  2804. OS_64,OS_S64:
  2805. begin
  2806. fromsize:=OS_F64;
  2807. { since we are loading an integer, no conversion may be required }
  2808. if (fromsize<>tosize) then
  2809. internalerror(2009112901);
  2810. end;
  2811. end;
  2812. if (fromsize<>tosize) then
  2813. tmpmmreg:=getmmregister(list,fromsize)
  2814. else
  2815. tmpmmreg:=reg;
  2816. if (ref.alignment in [1,2]) then
  2817. begin
  2818. case fromsize of
  2819. OS_F32:
  2820. begin
  2821. intreg:=getintregister(list,OS_32);
  2822. a_load_ref_reg(list,OS_32,OS_32,ref,intreg);
  2823. a_loadmm_intreg_reg(list,OS_32,OS_F32,intreg,tmpmmreg,mms_movescalar);
  2824. end;
  2825. OS_F64:
  2826. begin
  2827. reg64.reglo:=getintregister(list,OS_32);
  2828. reg64.reghi:=getintregister(list,OS_32);
  2829. cg64.a_load64_ref_reg(list,ref,reg64);
  2830. cg64.a_loadmm_intreg64_reg(list,OS_F64,reg64,tmpmmreg);
  2831. end;
  2832. else
  2833. internalerror(2009112412);
  2834. end;
  2835. end
  2836. else
  2837. begin
  2838. handle_load_store(list,A_VLDR,PF_None,tmpmmreg,ref);
  2839. end;
  2840. if (tmpmmreg<>reg) then
  2841. a_loadmm_reg_reg(list,fromsize,tosize,tmpmmreg,reg,shuffle);
  2842. end;
  2843. procedure tbasecgarm.a_loadmm_reg_ref(list: tasmlist; fromsize,tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  2844. var
  2845. intreg,
  2846. tmpmmreg : tregister;
  2847. reg64 : tregister64;
  2848. begin
  2849. if assigned(shuffle) and
  2850. not(shufflescalar(shuffle)) then
  2851. internalerror(2009112416);
  2852. case tosize of
  2853. OS_32,OS_S32:
  2854. begin
  2855. tosize:=OS_F32;
  2856. { since we are loading an integer, no conversion may be required }
  2857. if (fromsize<>tosize) then
  2858. internalerror(2009112801);
  2859. end;
  2860. OS_64,OS_S64:
  2861. begin
  2862. tosize:=OS_F64;
  2863. { since we are loading an integer, no conversion may be required }
  2864. if (fromsize<>tosize) then
  2865. internalerror(2009112901);
  2866. end;
  2867. end;
  2868. if (fromsize<>tosize) then
  2869. begin
  2870. tmpmmreg:=getmmregister(list,tosize);
  2871. a_loadmm_reg_reg(list,fromsize,tosize,reg,tmpmmreg,shuffle);
  2872. end
  2873. else
  2874. tmpmmreg:=reg;
  2875. if (ref.alignment in [1,2]) then
  2876. begin
  2877. case tosize of
  2878. OS_F32:
  2879. begin
  2880. intreg:=getintregister(list,OS_32);
  2881. a_loadmm_reg_intreg(list,OS_F32,OS_32,tmpmmreg,intreg,shuffle);
  2882. a_load_reg_ref(list,OS_32,OS_32,intreg,ref);
  2883. end;
  2884. OS_F64:
  2885. begin
  2886. reg64.reglo:=getintregister(list,OS_32);
  2887. reg64.reghi:=getintregister(list,OS_32);
  2888. cg64.a_loadmm_reg_intreg64(list,OS_F64,tmpmmreg,reg64);
  2889. cg64.a_load64_reg_ref(list,reg64,ref);
  2890. end;
  2891. else
  2892. internalerror(2009112417);
  2893. end;
  2894. end
  2895. else
  2896. begin
  2897. handle_load_store(list,A_VSTR,PF_None,tmpmmreg,ref);
  2898. end;
  2899. end;
  2900. procedure tbasecgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  2901. begin
  2902. { this code can only be used to transfer raw data, not to perform
  2903. conversions }
  2904. if (tosize<>OS_F32) then
  2905. internalerror(2009112419);
  2906. if not(fromsize in [OS_32,OS_S32]) then
  2907. internalerror(2009112420);
  2908. if assigned(shuffle) and
  2909. not shufflescalar(shuffle) then
  2910. internalerror(2009112516);
  2911. list.concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg));
  2912. end;
  2913. procedure tbasecgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize; mmreg, intreg: tregister;shuffle : pmmshuffle);
  2914. begin
  2915. { this code can only be used to transfer raw data, not to perform
  2916. conversions }
  2917. if (fromsize<>OS_F32) then
  2918. internalerror(2009112430);
  2919. if not(tosize in [OS_32,OS_S32]) then
  2920. internalerror(2009112420);
  2921. if assigned(shuffle) and
  2922. not shufflescalar(shuffle) then
  2923. internalerror(2009112514);
  2924. list.concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg));
  2925. end;
  2926. procedure tbasecgarm.a_opmm_reg_reg(list: tasmlist; op: topcg; size: tcgsize; src, dst: tregister; shuffle: pmmshuffle);
  2927. var
  2928. tmpreg: tregister;
  2929. begin
  2930. { the vfp doesn't support xor nor any other logical operation, but
  2931. this routine is used to initialise global mm regvars. We can
  2932. easily initialise an mm reg with 0 though. }
  2933. case op of
  2934. OP_XOR:
  2935. begin
  2936. if (src<>dst) or
  2937. (reg_cgsize(src)<>size) or
  2938. assigned(shuffle) then
  2939. internalerror(2009112907);
  2940. tmpreg:=getintregister(list,OS_32);
  2941. a_load_const_reg(list,OS_32,0,tmpreg);
  2942. case size of
  2943. OS_F32:
  2944. list.concat(taicpu.op_reg_reg(A_VMOV,dst,tmpreg));
  2945. OS_F64:
  2946. list.concat(taicpu.op_reg_reg_reg(A_VMOV,dst,tmpreg,tmpreg));
  2947. else
  2948. internalerror(2009112908);
  2949. end;
  2950. end
  2951. else
  2952. internalerror(2009112906);
  2953. end;
  2954. end;
  2955. procedure tbasecgarm.maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  2956. const
  2957. overflowops = [OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NEG];
  2958. begin
  2959. if (op in overflowops) and
  2960. (size in [OS_8,OS_S8,OS_16,OS_S16]) then
  2961. a_load_reg_reg(list,OS_32,size,dst,dst);
  2962. end;
  2963. procedure tbasecgarm.safe_mla(list : TAsmList; op1,op2,op3,op4 : TRegister);
  2964. procedure checkreg(var reg : TRegister);
  2965. var
  2966. tmpreg : TRegister;
  2967. begin
  2968. if ((GenerateThumbCode or GenerateThumb2Code) and (getsupreg(reg)=RS_R13)) or
  2969. (getsupreg(reg)=RS_R15) then
  2970. begin
  2971. tmpreg:=getintregister(list,OS_INT);
  2972. a_load_reg_reg(list,OS_INT,OS_INT,reg,tmpreg);
  2973. reg:=tmpreg;
  2974. end;
  2975. end;
  2976. begin
  2977. checkreg(op1);
  2978. checkreg(op2);
  2979. checkreg(op3);
  2980. checkreg(op4);
  2981. list.concat(taicpu.op_reg_reg_reg_reg(A_MLA,op1,op2,op3,op4));
  2982. end;
  2983. procedure tcg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  2984. begin
  2985. case op of
  2986. OP_NEG:
  2987. begin
  2988. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2989. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  2990. list.concat(taicpu.op_reg_reg_const(A_RSC,regdst.reghi,regsrc.reghi,0));
  2991. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2992. end;
  2993. OP_NOT:
  2994. begin
  2995. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  2996. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  2997. end;
  2998. else
  2999. a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);
  3000. end;
  3001. end;
  3002. procedure tcg64farm.a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);
  3003. begin
  3004. a_op64_const_reg_reg(list,op,size,value,reg,reg);
  3005. end;
  3006. procedure tcg64farm.a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);
  3007. var
  3008. ovloc : tlocation;
  3009. begin
  3010. a_op64_const_reg_reg_checkoverflow(list,op,size,value,regsrc,regdst,false,ovloc);
  3011. end;
  3012. procedure tcg64farm.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);
  3013. var
  3014. ovloc : tlocation;
  3015. begin
  3016. a_op64_reg_reg_reg_checkoverflow(list,op,size,regsrc1,regsrc2,regdst,false,ovloc);
  3017. end;
  3018. procedure tcg64farm.a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);
  3019. begin
  3020. { this code can only be used to transfer raw data, not to perform
  3021. conversions }
  3022. if (mmsize<>OS_F64) then
  3023. internalerror(2009112405);
  3024. list.concat(taicpu.op_reg_reg_reg(A_VMOV,mmreg,intreg.reglo,intreg.reghi));
  3025. end;
  3026. procedure tcg64farm.a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);
  3027. begin
  3028. { this code can only be used to transfer raw data, not to perform
  3029. conversions }
  3030. if (mmsize<>OS_F64) then
  3031. internalerror(2009112406);
  3032. list.concat(taicpu.op_reg_reg_reg(A_VMOV,intreg.reglo,intreg.reghi,mmreg));
  3033. end;
  3034. procedure tcg64farm.a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3035. var
  3036. tmpreg : tregister;
  3037. b : byte;
  3038. begin
  3039. ovloc.loc:=LOC_VOID;
  3040. case op of
  3041. OP_NEG,
  3042. OP_NOT :
  3043. internalerror(2012022501);
  3044. end;
  3045. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3046. begin
  3047. case op of
  3048. OP_ADD:
  3049. begin
  3050. if is_shifter_const(lo(value),b) then
  3051. begin
  3052. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3053. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3054. end
  3055. else
  3056. begin
  3057. tmpreg:=cg.getintregister(list,OS_32);
  3058. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3059. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3060. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3061. end;
  3062. if is_shifter_const(hi(value),b) then
  3063. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,hi(value)),PF_S))
  3064. else
  3065. begin
  3066. tmpreg:=cg.getintregister(list,OS_32);
  3067. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3068. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3069. end;
  3070. end;
  3071. OP_SUB:
  3072. begin
  3073. if is_shifter_const(lo(value),b) then
  3074. begin
  3075. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3076. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3077. end
  3078. else
  3079. begin
  3080. tmpreg:=cg.getintregister(list,OS_32);
  3081. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3082. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3083. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3084. end;
  3085. if is_shifter_const(hi(value),b) then
  3086. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))),PF_S))
  3087. else
  3088. begin
  3089. tmpreg:=cg.getintregister(list,OS_32);
  3090. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3091. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3092. end;
  3093. end;
  3094. else
  3095. internalerror(200502131);
  3096. end;
  3097. if size=OS_64 then
  3098. begin
  3099. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3100. ovloc.loc:=LOC_FLAGS;
  3101. case op of
  3102. OP_ADD:
  3103. ovloc.resflags:=F_CS;
  3104. OP_SUB:
  3105. ovloc.resflags:=F_CC;
  3106. end;
  3107. end;
  3108. end
  3109. else
  3110. begin
  3111. case op of
  3112. OP_AND,OP_OR,OP_XOR:
  3113. begin
  3114. cg.a_op_const_reg_reg(list,op,OS_32,aint(lo(value)),regsrc.reglo,regdst.reglo);
  3115. cg.a_op_const_reg_reg(list,op,OS_32,aint(hi(value)),regsrc.reghi,regdst.reghi);
  3116. end;
  3117. OP_ADD:
  3118. begin
  3119. if is_shifter_const(aint(lo(value)),b) then
  3120. begin
  3121. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3122. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3123. end
  3124. else
  3125. begin
  3126. tmpreg:=cg.getintregister(list,OS_32);
  3127. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3128. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3129. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3130. end;
  3131. if is_shifter_const(aint(hi(value)),b) then
  3132. list.concat(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3133. else
  3134. begin
  3135. tmpreg:=cg.getintregister(list,OS_32);
  3136. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  3137. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg));
  3138. end;
  3139. end;
  3140. OP_SUB:
  3141. begin
  3142. if is_shifter_const(aint(lo(value)),b) then
  3143. begin
  3144. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3145. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3146. end
  3147. else
  3148. begin
  3149. tmpreg:=cg.getintregister(list,OS_32);
  3150. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3151. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3152. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3153. end;
  3154. if is_shifter_const(aint(hi(value)),b) then
  3155. list.concat(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3156. else
  3157. begin
  3158. tmpreg:=cg.getintregister(list,OS_32);
  3159. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3160. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg));
  3161. end;
  3162. end;
  3163. else
  3164. internalerror(2003083101);
  3165. end;
  3166. end;
  3167. end;
  3168. procedure tcg64farm.a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3169. begin
  3170. ovloc.loc:=LOC_VOID;
  3171. case op of
  3172. OP_NEG,
  3173. OP_NOT :
  3174. internalerror(2012022502);
  3175. end;
  3176. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3177. begin
  3178. case op of
  3179. OP_ADD:
  3180. begin
  3181. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3182. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3183. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi),PF_S));
  3184. end;
  3185. OP_SUB:
  3186. begin
  3187. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3188. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3189. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi),PF_S));
  3190. end;
  3191. else
  3192. internalerror(2003083101);
  3193. end;
  3194. if size=OS_64 then
  3195. begin
  3196. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3197. ovloc.loc:=LOC_FLAGS;
  3198. case op of
  3199. OP_ADD:
  3200. ovloc.resflags:=F_CS;
  3201. OP_SUB:
  3202. ovloc.resflags:=F_CC;
  3203. end;
  3204. end;
  3205. end
  3206. else
  3207. begin
  3208. case op of
  3209. OP_AND,OP_OR,OP_XOR:
  3210. begin
  3211. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);
  3212. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);
  3213. end;
  3214. OP_ADD:
  3215. begin
  3216. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3217. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3218. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi));
  3219. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3220. end;
  3221. OP_SUB:
  3222. begin
  3223. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3224. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3225. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi));
  3226. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3227. end;
  3228. else
  3229. internalerror(2003083101);
  3230. end;
  3231. end;
  3232. end;
  3233. procedure tthumbcgarm.init_register_allocators;
  3234. begin
  3235. inherited init_register_allocators;
  3236. if assigned(current_procinfo) and (current_procinfo.framepointer=NR_R7) then
  3237. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3238. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6],first_int_imreg,[])
  3239. else
  3240. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3241. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7],first_int_imreg,[]);
  3242. end;
  3243. procedure tthumbcgarm.done_register_allocators;
  3244. begin
  3245. rg[R_INTREGISTER].free;
  3246. rg[R_FPUREGISTER].free;
  3247. rg[R_MMREGISTER].free;
  3248. inherited done_register_allocators;
  3249. end;
  3250. procedure tthumbcgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  3251. var
  3252. ref : treference;
  3253. r : byte;
  3254. regs : tcpuregisterset;
  3255. stackmisalignment : pint;
  3256. registerarea: DWord;
  3257. stack_parameters: Boolean;
  3258. begin
  3259. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3260. LocalSize:=align(LocalSize,4);
  3261. { call instruction does not put anything on the stack }
  3262. stackmisalignment:=0;
  3263. if not(nostackframe) then
  3264. begin
  3265. a_reg_alloc(list,NR_STACK_POINTER_REG);
  3266. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3267. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  3268. { save int registers }
  3269. reference_reset(ref,4,[]);
  3270. ref.index:=NR_STACK_POINTER_REG;
  3271. ref.addressmode:=AM_PREINDEXED;
  3272. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3273. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3274. begin
  3275. //!!!! a_reg_alloc(list,NR_R12);
  3276. //!!!! list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  3277. end;
  3278. { the (old) ARM APCS requires saving both the stack pointer (to
  3279. crawl the stack) and the PC (to identify the function this
  3280. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  3281. and R15 -- still needs updating for EABI and Darwin, they don't
  3282. need that }
  3283. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3284. regs:=regs+[RS_R7,RS_R14]
  3285. else
  3286. // if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  3287. include(regs,RS_R14);
  3288. { safely estimate stack size }
  3289. if localsize+current_settings.alignment.localalignmax+4>508 then
  3290. begin
  3291. include(rg[R_INTREGISTER].used_in_proc,RS_R4);
  3292. include(regs,RS_R4);
  3293. end;
  3294. registerarea:=0;
  3295. if regs<>[] then
  3296. begin
  3297. for r:=RS_R0 to RS_R15 do
  3298. if r in regs then
  3299. inc(registerarea,4);
  3300. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,regs));
  3301. end;
  3302. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3303. if stack_parameters or (LocalSize<>0) or
  3304. ((stackmisalignment<>0) and
  3305. ((pi_do_call in current_procinfo.flags) or
  3306. (po_assembler in current_procinfo.procdef.procoptions))) then
  3307. begin
  3308. { do we access stack parameters?
  3309. if yes, the previously estimated stacksize must be used }
  3310. if stack_parameters then
  3311. begin
  3312. if localsize>tcpuprocinfo(current_procinfo).stackframesize then
  3313. begin
  3314. writeln(localsize);
  3315. writeln(tcpuprocinfo(current_procinfo).stackframesize);
  3316. internalerror(2013040601);
  3317. end
  3318. else
  3319. localsize:=tcpuprocinfo(current_procinfo).stackframesize-registerarea;
  3320. end
  3321. else
  3322. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3323. if localsize<508 then
  3324. begin
  3325. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  3326. end
  3327. else if localsize<=1016 then
  3328. begin
  3329. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3330. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize-508));
  3331. end
  3332. else
  3333. begin
  3334. a_load_const_reg(list,OS_ADDR,-localsize,NR_R4);
  3335. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R4));
  3336. include(regs,RS_R4);
  3337. //!!!! if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  3338. //!!!! a_reg_alloc(list,NR_R12);
  3339. //!!!! a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  3340. //!!!! list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  3341. //!!!! a_reg_dealloc(list,NR_R12);
  3342. end;
  3343. end;
  3344. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3345. begin
  3346. list.concat(taicpu.op_reg_reg_const(A_ADD,current_procinfo.framepointer,NR_STACK_POINTER_REG,0));
  3347. end;
  3348. end;
  3349. end;
  3350. procedure tthumbcgarm.g_proc_exit(list: TAsmList; parasize: longint; nostackframe: boolean);
  3351. var
  3352. LocalSize : longint;
  3353. r: byte;
  3354. regs : tcpuregisterset;
  3355. registerarea : DWord;
  3356. stackmisalignment: pint;
  3357. stack_parameters : Boolean;
  3358. begin
  3359. if not(nostackframe) then
  3360. begin
  3361. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3362. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3363. include(regs,RS_R15);
  3364. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3365. include(regs,getsupreg(current_procinfo.framepointer));
  3366. registerarea:=0;
  3367. for r:=RS_R0 to RS_R15 do
  3368. if r in regs then
  3369. inc(registerarea,4);
  3370. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3371. LocalSize:=current_procinfo.calc_stackframe_size;
  3372. if stack_parameters then
  3373. localsize:=tcpuprocinfo(current_procinfo).stackframesize-registerarea
  3374. else
  3375. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3376. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  3377. (target_info.system in systems_darwin) then
  3378. begin
  3379. if (LocalSize<>0) or
  3380. ((stackmisalignment<>0) and
  3381. ((pi_do_call in current_procinfo.flags) or
  3382. (po_assembler in current_procinfo.procdef.procoptions))) then
  3383. begin
  3384. if LocalSize=0 then
  3385. else if LocalSize<=508 then
  3386. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  3387. else if LocalSize<=1016 then
  3388. begin
  3389. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3390. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,localsize-508));
  3391. end
  3392. else
  3393. begin
  3394. a_reg_alloc(list,NR_R3);
  3395. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R3);
  3396. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R3));
  3397. a_reg_dealloc(list,NR_R3);
  3398. end;
  3399. end;
  3400. if regs=[] then
  3401. begin
  3402. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3403. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3404. else
  3405. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3406. end
  3407. else
  3408. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,regs));
  3409. end;
  3410. end
  3411. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3412. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3413. else
  3414. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3415. end;
  3416. procedure tthumbcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3417. var
  3418. oppostfix:toppostfix;
  3419. usedtmpref: treference;
  3420. tmpreg,tmpreg2 : tregister;
  3421. dir : integer;
  3422. begin
  3423. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3424. FromSize := ToSize;
  3425. case FromSize of
  3426. { signed integer registers }
  3427. OS_8:
  3428. oppostfix:=PF_B;
  3429. OS_S8:
  3430. oppostfix:=PF_SB;
  3431. OS_16:
  3432. oppostfix:=PF_H;
  3433. OS_S16:
  3434. oppostfix:=PF_SH;
  3435. OS_32,
  3436. OS_S32:
  3437. oppostfix:=PF_None;
  3438. else
  3439. InternalError(200308298);
  3440. end;
  3441. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3442. begin
  3443. if target_info.endian=endian_big then
  3444. dir:=-1
  3445. else
  3446. dir:=1;
  3447. case FromSize of
  3448. OS_16,OS_S16:
  3449. begin
  3450. { only complicated references need an extra loadaddr }
  3451. if assigned(ref.symbol) or
  3452. (ref.index<>NR_NO) or
  3453. (ref.offset<-124) or
  3454. (ref.offset>124) or
  3455. { sometimes the compiler reused registers }
  3456. (reg=ref.index) or
  3457. (reg=ref.base) then
  3458. begin
  3459. tmpreg2:=getintregister(list,OS_INT);
  3460. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3461. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment,ref.volatility);
  3462. end
  3463. else
  3464. usedtmpref:=ref;
  3465. if target_info.endian=endian_big then
  3466. inc(usedtmpref.offset,1);
  3467. tmpreg:=getintregister(list,OS_INT);
  3468. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3469. inc(usedtmpref.offset,dir);
  3470. if FromSize=OS_16 then
  3471. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3472. else
  3473. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3474. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3475. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3476. end;
  3477. OS_32,OS_S32:
  3478. begin
  3479. tmpreg:=getintregister(list,OS_INT);
  3480. { only complicated references need an extra loadaddr }
  3481. if assigned(ref.symbol) or
  3482. (ref.index<>NR_NO) or
  3483. (ref.offset<-124) or
  3484. (ref.offset>124) or
  3485. { sometimes the compiler reused registers }
  3486. (reg=ref.index) or
  3487. (reg=ref.base) then
  3488. begin
  3489. tmpreg2:=getintregister(list,OS_INT);
  3490. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3491. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment,ref.volatility);
  3492. end
  3493. else
  3494. usedtmpref:=ref;
  3495. if ref.alignment=2 then
  3496. begin
  3497. if target_info.endian=endian_big then
  3498. inc(usedtmpref.offset,2);
  3499. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  3500. inc(usedtmpref.offset,dir*2);
  3501. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  3502. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3503. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3504. end
  3505. else
  3506. begin
  3507. if target_info.endian=endian_big then
  3508. inc(usedtmpref.offset,3);
  3509. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3510. inc(usedtmpref.offset,dir);
  3511. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3512. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3513. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3514. inc(usedtmpref.offset,dir);
  3515. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3516. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3517. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3518. inc(usedtmpref.offset,dir);
  3519. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3520. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,24));
  3521. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3522. end;
  3523. end
  3524. else
  3525. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3526. end;
  3527. end
  3528. else
  3529. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3530. if (fromsize=OS_S8) and (tosize = OS_16) then
  3531. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  3532. end;
  3533. procedure tthumbcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3534. var
  3535. l : tasmlabel;
  3536. hr : treference;
  3537. begin
  3538. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3539. internalerror(2002090902);
  3540. if is_thumb_imm(a) then
  3541. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3542. else
  3543. begin
  3544. reference_reset(hr,4,[]);
  3545. current_asmdata.getjumplabel(l);
  3546. cg.a_label(current_procinfo.aktlocaldata,l);
  3547. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3548. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3549. hr.symbol:=l;
  3550. hr.base:=NR_PC;
  3551. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3552. end;
  3553. end;
  3554. procedure tthumbcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  3555. var
  3556. hsym : tsym;
  3557. href,
  3558. tmpref : treference;
  3559. paraloc : Pcgparalocation;
  3560. l : TAsmLabel;
  3561. begin
  3562. { calculate the parameter info for the procdef }
  3563. procdef.init_paraloc_info(callerside);
  3564. hsym:=tsym(procdef.parast.Find('self'));
  3565. if not(assigned(hsym) and
  3566. (hsym.typ=paravarsym)) then
  3567. internalerror(200305251);
  3568. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  3569. while paraloc<>nil do
  3570. with paraloc^ do
  3571. begin
  3572. case loc of
  3573. LOC_REGISTER:
  3574. begin
  3575. if is_thumb_imm(ioffset) then
  3576. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  3577. else
  3578. begin
  3579. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3580. reference_reset(tmpref,4,[]);
  3581. current_asmdata.getjumplabel(l);
  3582. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3583. cg.a_label(current_procinfo.aktlocaldata,l);
  3584. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3585. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3586. tmpref.symbol:=l;
  3587. tmpref.base:=NR_PC;
  3588. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3589. a_op_reg_reg(list,OP_SUB,size,NR_R4,register);
  3590. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3591. end;
  3592. end;
  3593. LOC_REFERENCE:
  3594. begin
  3595. { offset in the wrapper needs to be adjusted for the stored
  3596. return address }
  3597. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),sizeof(pint),[]);
  3598. if is_thumb_imm(ioffset) then
  3599. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  3600. else
  3601. begin
  3602. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3603. reference_reset(tmpref,4,[]);
  3604. current_asmdata.getjumplabel(l);
  3605. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3606. cg.a_label(current_procinfo.aktlocaldata,l);
  3607. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3608. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3609. tmpref.symbol:=l;
  3610. tmpref.base:=NR_PC;
  3611. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3612. a_op_reg_ref(list,OP_SUB,size,NR_R4,href);
  3613. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3614. end;
  3615. end
  3616. else
  3617. internalerror(200309189);
  3618. end;
  3619. paraloc:=next;
  3620. end;
  3621. end;
  3622. function tthumbcgarm.handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference;
  3623. var
  3624. href : treference;
  3625. tmpreg : TRegister;
  3626. begin
  3627. href:=ref;
  3628. if { LDR/STR limitations }
  3629. (
  3630. (((op=A_LDR) and (oppostfix=PF_None)) or
  3631. ((op=A_STR) and (oppostfix=PF_None))) and
  3632. (ref.base<>NR_STACK_POINTER_REG) and
  3633. (abs(ref.offset)>124)
  3634. ) or
  3635. { LDRB/STRB limitations }
  3636. (
  3637. (((op=A_LDR) and (oppostfix=PF_B)) or
  3638. ((op=A_LDRB) and (oppostfix=PF_None)) or
  3639. ((op=A_STR) and (oppostfix=PF_B)) or
  3640. ((op=A_STRB) and (oppostfix=PF_None))) and
  3641. ((ref.base=NR_STACK_POINTER_REG) or
  3642. (ref.index=NR_STACK_POINTER_REG) or
  3643. (abs(ref.offset)>31)
  3644. )
  3645. ) or
  3646. { LDRH/STRH limitations }
  3647. (
  3648. (((op=A_LDR) and (oppostfix=PF_H)) or
  3649. ((op=A_LDRH) and (oppostfix=PF_None)) or
  3650. ((op=A_STR) and (oppostfix=PF_H)) or
  3651. ((op=A_STRH) and (oppostfix=PF_None))) and
  3652. ((ref.base=NR_STACK_POINTER_REG) or
  3653. (ref.index=NR_STACK_POINTER_REG) or
  3654. (abs(ref.offset)>62) or
  3655. ((abs(ref.offset) mod 2)<>0)
  3656. )
  3657. ) then
  3658. begin
  3659. tmpreg:=getintregister(list,OS_ADDR);
  3660. a_loadaddr_ref_reg(list,ref,tmpreg);
  3661. reference_reset_base(href,tmpreg,0,ref.alignment,ref.volatility);
  3662. end
  3663. else if (op=A_LDR) and
  3664. (oppostfix in [PF_None]) and
  3665. (ref.base=NR_STACK_POINTER_REG) and
  3666. (abs(ref.offset)>1020) then
  3667. begin
  3668. tmpreg:=getintregister(list,OS_ADDR);
  3669. a_loadaddr_ref_reg(list,ref,tmpreg);
  3670. reference_reset_base(href,tmpreg,0,ref.alignment,ref.volatility);
  3671. end
  3672. else if (op=A_LDR) and
  3673. ((oppostfix in [PF_SH,PF_SB]) or
  3674. (abs(ref.offset)>124)) then
  3675. begin
  3676. tmpreg:=getintregister(list,OS_ADDR);
  3677. a_loadaddr_ref_reg(list,ref,tmpreg);
  3678. reference_reset_base(href,tmpreg,0,ref.alignment,ref.volatility);
  3679. end;
  3680. Result:=inherited handle_load_store(list, op, oppostfix, reg, href);
  3681. end;
  3682. procedure tthumbcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  3683. var
  3684. tmpreg : tregister;
  3685. begin
  3686. case op of
  3687. OP_NEG:
  3688. list.concat(taicpu.op_reg_reg(A_NEG,dst,src));
  3689. OP_NOT:
  3690. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  3691. OP_DIV,OP_IDIV:
  3692. internalerror(200308284);
  3693. OP_ROL:
  3694. begin
  3695. if not(size in [OS_32,OS_S32]) then
  3696. internalerror(2008072801);
  3697. { simulate ROL by ror'ing 32-value }
  3698. tmpreg:=getintregister(list,OS_32);
  3699. a_load_const_reg(list,OS_32,32,tmpreg);
  3700. list.concat(taicpu.op_reg_reg(A_SUB,tmpreg,src));
  3701. list.concat(taicpu.op_reg_reg(A_ROR,dst,src));
  3702. end;
  3703. else
  3704. begin
  3705. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3706. list.concat(setoppostfix(
  3707. taicpu.op_reg_reg(op_reg_opcg2asmop[op],dst,src),op_reg_postfix[op]));
  3708. end;
  3709. end;
  3710. maybeadjustresult(list,op,size,dst);
  3711. end;
  3712. procedure tthumbcgarm.a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);
  3713. var
  3714. tmpreg : tregister;
  3715. {$ifdef DUMMY}
  3716. l1 : longint;
  3717. {$endif DUMMY}
  3718. begin
  3719. //!!! ovloc.loc:=LOC_VOID;
  3720. if {$ifopt R+}(a<>-2147483648) and{$endif} {!!!!!! not setflags and } is_thumb_imm(-a) then
  3721. case op of
  3722. OP_ADD:
  3723. begin
  3724. op:=OP_SUB;
  3725. a:=aint(dword(-a));
  3726. end;
  3727. OP_SUB:
  3728. begin
  3729. op:=OP_ADD;
  3730. a:=aint(dword(-a));
  3731. end
  3732. end;
  3733. if is_thumb_imm(a) and (op in [OP_ADD,OP_SUB]) then
  3734. begin
  3735. // if cgsetflags or setflags then
  3736. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3737. list.concat(setoppostfix(
  3738. taicpu.op_reg_const(op_reg_opcg2asmop[op],dst,a),op_reg_postfix[op]));
  3739. if (cgsetflags {!!! or setflags }) and (size in [OS_8,OS_16,OS_32]) then
  3740. begin
  3741. //!!! ovloc.loc:=LOC_FLAGS;
  3742. case op of
  3743. OP_ADD:
  3744. //!!! ovloc.resflags:=F_CS;
  3745. ;
  3746. OP_SUB:
  3747. //!!! ovloc.resflags:=F_CC;
  3748. ;
  3749. end;
  3750. end;
  3751. end
  3752. else
  3753. begin
  3754. { there could be added some more sophisticated optimizations }
  3755. if (op in [OP_MUL,OP_IMUL,OP_DIV,OP_IDIV]) and (a=1) then
  3756. a_load_reg_reg(list,size,size,dst,dst)
  3757. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  3758. a_load_const_reg(list,size,0,dst)
  3759. else if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  3760. a_op_reg_reg(list,OP_NEG,size,dst,dst)
  3761. { we do this here instead in the peephole optimizer because
  3762. it saves us a register }
  3763. {$ifdef DUMMY}
  3764. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  3765. a_op_const_reg_reg(list,OP_SHL,size,l1,dst,dst)
  3766. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  3767. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  3768. begin
  3769. if l1>32 then{roozbeh does this ever happen?}
  3770. internalerror(200308296);
  3771. shifterop_reset(so);
  3772. so.shiftmode:=SM_LSL;
  3773. so.shiftimm:=l1;
  3774. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,dst,so));
  3775. end
  3776. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  3777. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  3778. begin
  3779. if l1>32 then{does this ever happen?}
  3780. internalerror(201205181);
  3781. shifterop_reset(so);
  3782. so.shiftmode:=SM_LSL;
  3783. so.shiftimm:=l1;
  3784. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,dst,dst,so));
  3785. end
  3786. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,dst,dst) then
  3787. begin
  3788. { nothing to do on success }
  3789. end
  3790. {$endif DUMMY}
  3791. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  3792. Just using mov x, #0 might allow some easier optimizations down the line. }
  3793. else if (op = OP_AND) and (dword(a)=0) then
  3794. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  3795. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  3796. else if (op = OP_AND) and (not(dword(a))=0) then
  3797. // do nothing
  3798. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  3799. broader range of shifterconstants.}
  3800. {$ifdef DUMMY}
  3801. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  3802. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,not(dword(a))))
  3803. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  3804. begin
  3805. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm1));
  3806. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  3807. end
  3808. else if (op in [OP_ADD, OP_SUB, OP_OR]) and
  3809. not(cgsetflags or setflags) and
  3810. split_into_shifter_const(a, imm1, imm2) then
  3811. begin
  3812. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm1));
  3813. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  3814. end
  3815. {$endif DUMMY}
  3816. else if (op in [OP_SHL, OP_SHR, OP_SAR]) then
  3817. begin
  3818. list.concat(taicpu.op_reg_reg_const(op_reg_opcg2asmop[op],dst,dst,a));
  3819. end
  3820. else
  3821. begin
  3822. tmpreg:=getintregister(list,size);
  3823. a_load_const_reg(list,size,a,tmpreg);
  3824. a_op_reg_reg(list,op,size,tmpreg,dst);
  3825. end;
  3826. end;
  3827. maybeadjustresult(list,op,size,dst);
  3828. end;
  3829. procedure tthumbcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister);
  3830. begin
  3831. if (op=OP_ADD) and (src=NR_R13) and (dst<>NR_R13) and ((a mod 4)=0) and (a>0) and (a<=1020) then
  3832. list.concat(taicpu.op_reg_reg_const(A_ADD,dst,src,a))
  3833. else
  3834. inherited a_op_const_reg_reg(list,op,size,a,src,dst);
  3835. end;
  3836. procedure tthumbcgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  3837. var
  3838. l1,l2 : tasmlabel;
  3839. ai : taicpu;
  3840. begin
  3841. current_asmdata.getjumplabel(l1);
  3842. current_asmdata.getjumplabel(l2);
  3843. ai:=setcondition(taicpu.op_sym(A_B,l1),flags_to_cond(f));
  3844. ai.is_jmp:=true;
  3845. list.concat(ai);
  3846. list.concat(taicpu.op_reg_const(A_MOV,reg,0));
  3847. list.concat(taicpu.op_sym(A_B,l2));
  3848. cg.a_label(list,l1);
  3849. list.concat(taicpu.op_reg_const(A_MOV,reg,1));
  3850. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3851. cg.a_label(list,l2);
  3852. end;
  3853. procedure tthumb2cgarm.init_register_allocators;
  3854. begin
  3855. inherited init_register_allocators;
  3856. { currently, we save R14 always, so we can use it }
  3857. if (target_info.system<>system_arm_darwin) then
  3858. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3859. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3860. RS_R9,RS_R10,RS_R12,RS_R14],first_int_imreg,[])
  3861. else
  3862. { r9 is not available on Darwin according to the llvm code generator }
  3863. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3864. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3865. RS_R10,RS_R12,RS_R14],first_int_imreg,[]);
  3866. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  3867. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  3868. if current_settings.fputype in [fpu_vfpv3,fpu_vfpv4] then
  3869. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3870. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3871. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  3872. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3873. ],first_mm_imreg,[])
  3874. else if current_settings.fputype in [fpu_fpv4_s16,fpu_vfpv3_d16] then
  3875. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3876. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3877. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3878. ],first_mm_imreg,[])
  3879. else
  3880. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBNONE,
  3881. [RS_S0,RS_S1,RS_R2,RS_R3,RS_R4,RS_S31],first_mm_imreg,[]);
  3882. end;
  3883. procedure tthumb2cgarm.done_register_allocators;
  3884. begin
  3885. rg[R_INTREGISTER].free;
  3886. rg[R_FPUREGISTER].free;
  3887. rg[R_MMREGISTER].free;
  3888. inherited done_register_allocators;
  3889. end;
  3890. procedure tthumb2cgarm.a_call_reg(list : TAsmList;reg: tregister);
  3891. begin
  3892. list.concat(taicpu.op_reg(A_BLX, reg));
  3893. {
  3894. the compiler does not properly set this flag anymore in pass 1, and
  3895. for now we only need it after pass 2 (I hope) (JM)
  3896. if not(pi_do_call in current_procinfo.flags) then
  3897. internalerror(2003060703);
  3898. }
  3899. include(current_procinfo.flags,pi_do_call);
  3900. end;
  3901. procedure tthumb2cgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3902. var
  3903. l : tasmlabel;
  3904. hr : treference;
  3905. begin
  3906. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3907. internalerror(2002090902);
  3908. if is_thumb32_imm(a) then
  3909. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3910. else if is_thumb32_imm(not(a)) then
  3911. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  3912. else if (a and $FFFF)=a then
  3913. list.concat(taicpu.op_reg_const(A_MOVW,reg,a))
  3914. else
  3915. begin
  3916. reference_reset(hr,4,[]);
  3917. current_asmdata.getjumplabel(l);
  3918. cg.a_label(current_procinfo.aktlocaldata,l);
  3919. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3920. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3921. hr.symbol:=l;
  3922. hr.base:=NR_PC;
  3923. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3924. end;
  3925. end;
  3926. procedure tthumb2cgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3927. var
  3928. oppostfix:toppostfix;
  3929. usedtmpref: treference;
  3930. tmpreg,tmpreg2 : tregister;
  3931. so : tshifterop;
  3932. dir : integer;
  3933. begin
  3934. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3935. FromSize := ToSize;
  3936. case FromSize of
  3937. { signed integer registers }
  3938. OS_8:
  3939. oppostfix:=PF_B;
  3940. OS_S8:
  3941. oppostfix:=PF_SB;
  3942. OS_16:
  3943. oppostfix:=PF_H;
  3944. OS_S16:
  3945. oppostfix:=PF_SH;
  3946. OS_32,
  3947. OS_S32:
  3948. oppostfix:=PF_None;
  3949. else
  3950. InternalError(200308299);
  3951. end;
  3952. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3953. begin
  3954. if target_info.endian=endian_big then
  3955. dir:=-1
  3956. else
  3957. dir:=1;
  3958. case FromSize of
  3959. OS_16,OS_S16:
  3960. begin
  3961. { only complicated references need an extra loadaddr }
  3962. if assigned(ref.symbol) or
  3963. (ref.index<>NR_NO) or
  3964. (ref.offset<-255) or
  3965. (ref.offset>4094) or
  3966. { sometimes the compiler reused registers }
  3967. (reg=ref.index) or
  3968. (reg=ref.base) then
  3969. begin
  3970. tmpreg2:=getintregister(list,OS_INT);
  3971. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3972. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment,ref.volatility);
  3973. end
  3974. else
  3975. usedtmpref:=ref;
  3976. if target_info.endian=endian_big then
  3977. inc(usedtmpref.offset,1);
  3978. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  3979. tmpreg:=getintregister(list,OS_INT);
  3980. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3981. inc(usedtmpref.offset,dir);
  3982. if FromSize=OS_16 then
  3983. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3984. else
  3985. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3986. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  3987. end;
  3988. OS_32,OS_S32:
  3989. begin
  3990. tmpreg:=getintregister(list,OS_INT);
  3991. { only complicated references need an extra loadaddr }
  3992. if assigned(ref.symbol) or
  3993. (ref.index<>NR_NO) or
  3994. (ref.offset<-255) or
  3995. (ref.offset>4092) or
  3996. { sometimes the compiler reused registers }
  3997. (reg=ref.index) or
  3998. (reg=ref.base) then
  3999. begin
  4000. tmpreg2:=getintregister(list,OS_INT);
  4001. a_loadaddr_ref_reg(list,ref,tmpreg2);
  4002. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment,ref.volatility);
  4003. end
  4004. else
  4005. usedtmpref:=ref;
  4006. shifterop_reset(so);so.shiftmode:=SM_LSL;
  4007. if ref.alignment=2 then
  4008. begin
  4009. if target_info.endian=endian_big then
  4010. inc(usedtmpref.offset,2);
  4011. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  4012. inc(usedtmpref.offset,dir*2);
  4013. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  4014. so.shiftimm:=16;
  4015. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4016. end
  4017. else
  4018. begin
  4019. if target_info.endian=endian_big then
  4020. inc(usedtmpref.offset,3);
  4021. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  4022. inc(usedtmpref.offset,dir);
  4023. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4024. so.shiftimm:=8;
  4025. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4026. inc(usedtmpref.offset,dir);
  4027. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4028. so.shiftimm:=16;
  4029. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4030. inc(usedtmpref.offset,dir);
  4031. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4032. so.shiftimm:=24;
  4033. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4034. end;
  4035. end
  4036. else
  4037. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4038. end;
  4039. end
  4040. else
  4041. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4042. if (fromsize=OS_S8) and (tosize = OS_16) then
  4043. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  4044. end;
  4045. procedure tthumb2cgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  4046. begin
  4047. if op = OP_NOT then
  4048. begin
  4049. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  4050. case size of
  4051. OS_8: list.concat(taicpu.op_reg_reg(A_UXTB,dst,dst));
  4052. OS_S8: list.concat(taicpu.op_reg_reg(A_SXTB,dst,dst));
  4053. OS_16: list.concat(taicpu.op_reg_reg(A_UXTH,dst,dst));
  4054. OS_S16: list.concat(taicpu.op_reg_reg(A_SXTH,dst,dst));
  4055. end;
  4056. end
  4057. else
  4058. inherited a_op_reg_reg(list, op, size, src, dst);
  4059. end;
  4060. procedure tthumb2cgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4061. var
  4062. shift, width : byte;
  4063. tmpreg : tregister;
  4064. so : tshifterop;
  4065. l1 : longint;
  4066. begin
  4067. ovloc.loc:=LOC_VOID;
  4068. if {$ifopt R+}(a<>-2147483648) and{$endif} is_shifter_const(-a,shift) then
  4069. case op of
  4070. OP_ADD:
  4071. begin
  4072. op:=OP_SUB;
  4073. a:=aint(dword(-a));
  4074. end;
  4075. OP_SUB:
  4076. begin
  4077. op:=OP_ADD;
  4078. a:=aint(dword(-a));
  4079. end
  4080. end;
  4081. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  4082. case op of
  4083. OP_NEG,OP_NOT,
  4084. OP_DIV,OP_IDIV:
  4085. internalerror(200308285);
  4086. OP_SHL:
  4087. begin
  4088. if a>32 then
  4089. internalerror(2014020703);
  4090. if a<>0 then
  4091. begin
  4092. shifterop_reset(so);
  4093. so.shiftmode:=SM_LSL;
  4094. so.shiftimm:=a;
  4095. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4096. end
  4097. else
  4098. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4099. end;
  4100. OP_ROL:
  4101. begin
  4102. if a>32 then
  4103. internalerror(2014020704);
  4104. if a<>0 then
  4105. begin
  4106. shifterop_reset(so);
  4107. so.shiftmode:=SM_ROR;
  4108. so.shiftimm:=32-a;
  4109. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4110. end
  4111. else
  4112. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4113. end;
  4114. OP_ROR:
  4115. begin
  4116. if a>32 then
  4117. internalerror(2014020705);
  4118. if a<>0 then
  4119. begin
  4120. shifterop_reset(so);
  4121. so.shiftmode:=SM_ROR;
  4122. so.shiftimm:=a;
  4123. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4124. end
  4125. else
  4126. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4127. end;
  4128. OP_SHR:
  4129. begin
  4130. if a>32 then
  4131. internalerror(200308292);
  4132. shifterop_reset(so);
  4133. if a<>0 then
  4134. begin
  4135. so.shiftmode:=SM_LSR;
  4136. so.shiftimm:=a;
  4137. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4138. end
  4139. else
  4140. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4141. end;
  4142. OP_SAR:
  4143. begin
  4144. if a>32 then
  4145. internalerror(200308295);
  4146. if a<>0 then
  4147. begin
  4148. shifterop_reset(so);
  4149. so.shiftmode:=SM_ASR;
  4150. so.shiftimm:=a;
  4151. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4152. end
  4153. else
  4154. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4155. end;
  4156. else
  4157. if (op in [OP_SUB, OP_ADD]) and
  4158. ((a < 0) or
  4159. (a > 4095)) then
  4160. begin
  4161. tmpreg:=getintregister(list,size);
  4162. a_load_const_reg(list, size, a, tmpreg);
  4163. if cgsetflags or setflags then
  4164. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4165. list.concat(setoppostfix(
  4166. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4167. end
  4168. else
  4169. begin
  4170. if cgsetflags or setflags then
  4171. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4172. list.concat(setoppostfix(
  4173. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4174. end;
  4175. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  4176. begin
  4177. ovloc.loc:=LOC_FLAGS;
  4178. case op of
  4179. OP_ADD:
  4180. ovloc.resflags:=F_CS;
  4181. OP_SUB:
  4182. ovloc.resflags:=F_CC;
  4183. end;
  4184. end;
  4185. end
  4186. else
  4187. begin
  4188. { there could be added some more sophisticated optimizations }
  4189. if (op in [OP_MUL,OP_IMUL]) and (a=1) then
  4190. a_load_reg_reg(list,size,size,src,dst)
  4191. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  4192. a_load_const_reg(list,size,0,dst)
  4193. else if (op in [OP_IMUL]) and (a=-1) then
  4194. a_op_reg_reg(list,OP_NEG,size,src,dst)
  4195. { we do this here instead in the peephole optimizer because
  4196. it saves us a register }
  4197. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  4198. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  4199. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  4200. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  4201. begin
  4202. if l1>32 then{roozbeh does this ever happen?}
  4203. internalerror(200308296);
  4204. shifterop_reset(so);
  4205. so.shiftmode:=SM_LSL;
  4206. so.shiftimm:=l1;
  4207. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  4208. end
  4209. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  4210. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  4211. begin
  4212. if l1>32 then{does this ever happen?}
  4213. internalerror(201205181);
  4214. shifterop_reset(so);
  4215. so.shiftmode:=SM_LSL;
  4216. so.shiftimm:=l1;
  4217. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  4218. end
  4219. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  4220. begin
  4221. { nothing to do on success }
  4222. end
  4223. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  4224. Just using mov x, #0 might allow some easier optimizations down the line. }
  4225. else if (op = OP_AND) and (dword(a)=0) then
  4226. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  4227. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  4228. else if (op = OP_AND) and (not(dword(a))=0) then
  4229. list.concat(taicpu.op_reg_reg(A_MOV,dst,src))
  4230. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  4231. broader range of shifterconstants.}
  4232. {else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  4233. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))}
  4234. else if (op = OP_AND) and is_thumb32_imm(a) then
  4235. list.concat(taicpu.op_reg_reg_const(A_AND,dst,src,dword(a)))
  4236. else if (op = OP_AND) and (a = $FFFF) then
  4237. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  4238. else if (op = OP_AND) and is_thumb32_imm(not(dword(a))) then
  4239. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  4240. else if (op = OP_AND) and is_continuous_mask(not(a), shift, width) then
  4241. begin
  4242. a_load_reg_reg(list,size,size,src,dst);
  4243. list.concat(taicpu.op_reg_const_const(A_BFC,dst,shift,width))
  4244. end
  4245. else
  4246. begin
  4247. tmpreg:=getintregister(list,size);
  4248. a_load_const_reg(list,size,a,tmpreg);
  4249. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  4250. end;
  4251. end;
  4252. maybeadjustresult(list,op,size,dst);
  4253. end;
  4254. const
  4255. op_reg_reg_opcg2asmopThumb2: array[TOpCG] of tasmop =
  4256. (A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NONE,A_MVN,A_ORR,
  4257. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  4258. procedure tthumb2cgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4259. var
  4260. so : tshifterop;
  4261. tmpreg,overflowreg : tregister;
  4262. asmop : tasmop;
  4263. begin
  4264. ovloc.loc:=LOC_VOID;
  4265. case op of
  4266. OP_NEG,OP_NOT:
  4267. internalerror(200308286);
  4268. OP_ROL:
  4269. begin
  4270. if not(size in [OS_32,OS_S32]) then
  4271. internalerror(2008072801);
  4272. { simulate ROL by ror'ing 32-value }
  4273. tmpreg:=getintregister(list,OS_32);
  4274. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,32));
  4275. list.concat(taicpu.op_reg_reg_reg(A_SUB,src1,tmpreg,src1));
  4276. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4277. end;
  4278. OP_ROR:
  4279. begin
  4280. if not(size in [OS_32,OS_S32]) then
  4281. internalerror(2008072802);
  4282. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4283. end;
  4284. OP_IMUL,
  4285. OP_MUL:
  4286. begin
  4287. if cgsetflags or setflags then
  4288. begin
  4289. overflowreg:=getintregister(list,size);
  4290. if op=OP_IMUL then
  4291. asmop:=A_SMULL
  4292. else
  4293. asmop:=A_UMULL;
  4294. { the arm doesn't allow that rd and rm are the same }
  4295. if dst=src2 then
  4296. begin
  4297. if dst<>src1 then
  4298. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  4299. else
  4300. begin
  4301. tmpreg:=getintregister(list,size);
  4302. a_load_reg_reg(list,size,size,src2,dst);
  4303. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  4304. end;
  4305. end
  4306. else
  4307. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  4308. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4309. if op=OP_IMUL then
  4310. begin
  4311. shifterop_reset(so);
  4312. so.shiftmode:=SM_ASR;
  4313. so.shiftimm:=31;
  4314. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  4315. end
  4316. else
  4317. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  4318. ovloc.loc:=LOC_FLAGS;
  4319. ovloc.resflags:=F_NE;
  4320. end
  4321. else
  4322. begin
  4323. { the arm doesn't allow that rd and rm are the same }
  4324. if dst=src2 then
  4325. begin
  4326. if dst<>src1 then
  4327. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  4328. else
  4329. begin
  4330. tmpreg:=getintregister(list,size);
  4331. a_load_reg_reg(list,size,size,src2,dst);
  4332. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  4333. end;
  4334. end
  4335. else
  4336. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  4337. end;
  4338. end;
  4339. else
  4340. begin
  4341. if cgsetflags or setflags then
  4342. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4343. {$ifdef dummy}
  4344. { R13 is not allowed for certain instruction operands }
  4345. if op_reg_reg_opcg2asmopThumb2[op] in [A_ADD,A_SUB,A_AND,A_BIC,A_EOR] then
  4346. begin
  4347. if getsupreg(dst)=RS_R13 then
  4348. begin
  4349. tmpreg:=getintregister(list,OS_INT);
  4350. a_load_reg_reg(list,OS_INT,OS_INT,dst,tmpreg);
  4351. dst:=tmpreg;
  4352. end;
  4353. if getsupreg(src1)=RS_R13 then
  4354. begin
  4355. tmpreg:=getintregister(list,OS_INT);
  4356. a_load_reg_reg(list,OS_INT,OS_INT,src1,tmpreg);
  4357. src1:=tmpreg;
  4358. end;
  4359. end;
  4360. {$endif}
  4361. list.concat(setoppostfix(
  4362. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmopThumb2[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4363. end;
  4364. end;
  4365. maybeadjustresult(list,op,size,dst);
  4366. end;
  4367. procedure tthumb2cgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  4368. begin
  4369. list.concat(taicpu.op_cond(A_ITE, flags_to_cond(f)));
  4370. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  4371. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  4372. end;
  4373. procedure tthumb2cgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  4374. var
  4375. ref : treference;
  4376. shift : byte;
  4377. firstfloatreg,lastfloatreg,
  4378. r : byte;
  4379. regs : tcpuregisterset;
  4380. stackmisalignment: pint;
  4381. begin
  4382. LocalSize:=align(LocalSize,4);
  4383. { call instruction does not put anything on the stack }
  4384. stackmisalignment:=0;
  4385. if not(nostackframe) then
  4386. begin
  4387. firstfloatreg:=RS_NO;
  4388. lastfloatreg:=RS_NO;
  4389. { save floating point registers? }
  4390. for r:=RS_F0 to RS_F7 do
  4391. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4392. begin
  4393. if firstfloatreg=RS_NO then
  4394. firstfloatreg:=r;
  4395. lastfloatreg:=r;
  4396. inc(stackmisalignment,12);
  4397. end;
  4398. a_reg_alloc(list,NR_STACK_POINTER_REG);
  4399. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4400. begin
  4401. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  4402. a_reg_alloc(list,NR_R12);
  4403. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  4404. end;
  4405. { save int registers }
  4406. reference_reset(ref,4,[]);
  4407. ref.index:=NR_STACK_POINTER_REG;
  4408. ref.addressmode:=AM_PREINDEXED;
  4409. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4410. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4411. regs:=regs+[RS_FRAME_POINTER_REG,RS_R14]
  4412. else if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  4413. include(regs,RS_R14);
  4414. if regs<>[] then
  4415. begin
  4416. for r:=RS_R0 to RS_R15 do
  4417. if (r in regs) then
  4418. inc(stackmisalignment,4);
  4419. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4420. end;
  4421. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4422. begin
  4423. { the framepointer now points to the saved R15, so the saved
  4424. framepointer is at R11-12 (for get_caller_frame) }
  4425. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  4426. a_reg_dealloc(list,NR_R12);
  4427. end;
  4428. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4429. if (LocalSize<>0) or
  4430. ((stackmisalignment<>0) and
  4431. ((pi_do_call in current_procinfo.flags) or
  4432. (po_assembler in current_procinfo.procdef.procoptions))) then
  4433. begin
  4434. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4435. if not(is_shifter_const(localsize,shift)) then
  4436. begin
  4437. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  4438. a_reg_alloc(list,NR_R12);
  4439. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4440. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  4441. a_reg_dealloc(list,NR_R12);
  4442. end
  4443. else
  4444. begin
  4445. a_reg_dealloc(list,NR_R12);
  4446. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  4447. end;
  4448. end;
  4449. if firstfloatreg<>RS_NO then
  4450. begin
  4451. reference_reset(ref,4,[]);
  4452. if tg.direction*tcpuprocinfo(current_procinfo).floatregstart>=1023 then
  4453. begin
  4454. a_load_const_reg(list,OS_ADDR,-tcpuprocinfo(current_procinfo).floatregstart,NR_R12);
  4455. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4456. ref.base:=NR_R12;
  4457. end
  4458. else
  4459. begin
  4460. ref.base:=current_procinfo.framepointer;
  4461. ref.offset:=tcpuprocinfo(current_procinfo).floatregstart;
  4462. end;
  4463. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4464. lastfloatreg-firstfloatreg+1,ref));
  4465. end;
  4466. end;
  4467. end;
  4468. procedure tthumb2cgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  4469. var
  4470. ref : treference;
  4471. firstfloatreg,lastfloatreg,
  4472. r : byte;
  4473. shift : byte;
  4474. regs : tcpuregisterset;
  4475. LocalSize : longint;
  4476. stackmisalignment: pint;
  4477. begin
  4478. if not(nostackframe) then
  4479. begin
  4480. stackmisalignment:=0;
  4481. { restore floating point register }
  4482. firstfloatreg:=RS_NO;
  4483. lastfloatreg:=RS_NO;
  4484. { save floating point registers? }
  4485. for r:=RS_F0 to RS_F7 do
  4486. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4487. begin
  4488. if firstfloatreg=RS_NO then
  4489. firstfloatreg:=r;
  4490. lastfloatreg:=r;
  4491. { floating point register space is already included in
  4492. localsize below by calc_stackframe_size
  4493. inc(stackmisalignment,12);
  4494. }
  4495. end;
  4496. if firstfloatreg<>RS_NO then
  4497. begin
  4498. reference_reset(ref,4,[]);
  4499. if tg.direction*tcpuprocinfo(current_procinfo).floatregstart>=1023 then
  4500. begin
  4501. a_load_const_reg(list,OS_ADDR,-tcpuprocinfo(current_procinfo).floatregstart,NR_R12);
  4502. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4503. ref.base:=NR_R12;
  4504. end
  4505. else
  4506. begin
  4507. ref.base:=current_procinfo.framepointer;
  4508. ref.offset:=tcpuprocinfo(current_procinfo).floatregstart;
  4509. end;
  4510. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4511. lastfloatreg-firstfloatreg+1,ref));
  4512. end;
  4513. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4514. if (pi_do_call in current_procinfo.flags) or (regs<>[]) then
  4515. begin
  4516. exclude(regs,RS_R14);
  4517. include(regs,RS_R15);
  4518. end;
  4519. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  4520. regs:=regs+[RS_FRAME_POINTER_REG,RS_R15];
  4521. for r:=RS_R0 to RS_R15 do
  4522. if (r in regs) then
  4523. inc(stackmisalignment,4);
  4524. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4525. LocalSize:=current_procinfo.calc_stackframe_size;
  4526. if (LocalSize<>0) or
  4527. ((stackmisalignment<>0) and
  4528. ((pi_do_call in current_procinfo.flags) or
  4529. (po_assembler in current_procinfo.procdef.procoptions))) then
  4530. begin
  4531. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4532. if not(is_shifter_const(LocalSize,shift)) then
  4533. begin
  4534. a_reg_alloc(list,NR_R12);
  4535. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4536. list.concat(taicpu.op_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_R12));
  4537. a_reg_dealloc(list,NR_R12);
  4538. end
  4539. else
  4540. begin
  4541. a_reg_dealloc(list,NR_R12);
  4542. list.concat(taicpu.op_reg_const(A_ADD,NR_STACK_POINTER_REG,LocalSize));
  4543. end;
  4544. end;
  4545. if regs=[] then
  4546. list.concat(taicpu.op_reg_reg(A_MOV,NR_R15,NR_R14))
  4547. else
  4548. begin
  4549. reference_reset(ref,4,[]);
  4550. ref.index:=NR_STACK_POINTER_REG;
  4551. ref.addressmode:=AM_PREINDEXED;
  4552. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4553. end;
  4554. end
  4555. else
  4556. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14));
  4557. end;
  4558. function tthumb2cgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  4559. var
  4560. tmpreg : tregister;
  4561. tmpref : treference;
  4562. l : tasmlabel;
  4563. begin
  4564. tmpreg:=NR_NO;
  4565. { Be sure to have a base register }
  4566. if (ref.base=NR_NO) then
  4567. begin
  4568. if ref.shiftmode<>SM_None then
  4569. internalerror(2014020706);
  4570. ref.base:=ref.index;
  4571. ref.index:=NR_NO;
  4572. end;
  4573. { absolute symbols can't be handled directly, we've to store the symbol reference
  4574. in the text segment and access it pc relative
  4575. For now, we assume that references where base or index equals to PC are already
  4576. relative, all other references are assumed to be absolute and thus they need
  4577. to be handled extra.
  4578. A proper solution would be to change refoptions to a set and store the information
  4579. if the symbol is absolute or relative there.
  4580. }
  4581. if (assigned(ref.symbol) and
  4582. not(is_pc(ref.base)) and
  4583. not(is_pc(ref.index))
  4584. ) or
  4585. { [#xxx] isn't a valid address operand }
  4586. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  4587. //(ref.offset<-4095) or
  4588. (ref.offset<-255) or
  4589. (ref.offset>4095) or
  4590. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  4591. ((ref.offset<-255) or
  4592. (ref.offset>255)
  4593. )
  4594. ) or
  4595. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  4596. ((ref.offset<-1020) or
  4597. (ref.offset>1020) or
  4598. ((abs(ref.offset) mod 4)<>0) or
  4599. { the usual pc relative symbol handling assumes possible offsets of +/- 4095 }
  4600. assigned(ref.symbol)
  4601. )
  4602. ) then
  4603. begin
  4604. reference_reset(tmpref,4,[]);
  4605. { load symbol }
  4606. tmpreg:=getintregister(list,OS_INT);
  4607. if assigned(ref.symbol) then
  4608. begin
  4609. current_asmdata.getjumplabel(l);
  4610. cg.a_label(current_procinfo.aktlocaldata,l);
  4611. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  4612. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset));
  4613. { load consts entry }
  4614. tmpref.symbol:=l;
  4615. tmpref.base:=NR_R15;
  4616. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  4617. { in case of LDF/STF, we got rid of the NR_R15 }
  4618. if is_pc(ref.base) then
  4619. ref.base:=NR_NO;
  4620. if is_pc(ref.index) then
  4621. ref.index:=NR_NO;
  4622. end
  4623. else
  4624. a_load_const_reg(list,OS_ADDR,ref.offset,tmpreg);
  4625. if (ref.base<>NR_NO) then
  4626. begin
  4627. if ref.index<>NR_NO then
  4628. begin
  4629. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4630. ref.base:=tmpreg;
  4631. end
  4632. else
  4633. begin
  4634. ref.index:=tmpreg;
  4635. ref.shiftimm:=0;
  4636. ref.signindex:=1;
  4637. ref.shiftmode:=SM_None;
  4638. end;
  4639. end
  4640. else
  4641. ref.base:=tmpreg;
  4642. ref.offset:=0;
  4643. ref.symbol:=nil;
  4644. end;
  4645. if (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  4646. begin
  4647. if tmpreg<>NR_NO then
  4648. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg,tmpreg)
  4649. else
  4650. begin
  4651. tmpreg:=getintregister(list,OS_ADDR);
  4652. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg);
  4653. ref.base:=tmpreg;
  4654. end;
  4655. ref.offset:=0;
  4656. end;
  4657. { Hack? Thumb2 doesn't allow PC indexed addressing modes(although it does in the specification) }
  4658. if (ref.base=NR_R15) and (ref.index<>NR_NO) and (ref.shiftmode <> sm_none) then
  4659. begin
  4660. tmpreg:=getintregister(list,OS_ADDR);
  4661. list.concat(taicpu.op_reg_reg(A_MOV, tmpreg, NR_R15));
  4662. ref.base := tmpreg;
  4663. end;
  4664. { floating point operations have only limited references
  4665. we expect here, that a base is already set }
  4666. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  4667. begin
  4668. if ref.shiftmode<>SM_none then
  4669. internalerror(200309121);
  4670. if tmpreg<>NR_NO then
  4671. begin
  4672. if ref.base=tmpreg then
  4673. begin
  4674. if ref.signindex<0 then
  4675. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,tmpreg,ref.index))
  4676. else
  4677. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,tmpreg,ref.index));
  4678. ref.index:=NR_NO;
  4679. end
  4680. else
  4681. begin
  4682. if ref.index<>tmpreg then
  4683. internalerror(200403161);
  4684. if ref.signindex<0 then
  4685. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,ref.base,tmpreg))
  4686. else
  4687. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4688. ref.base:=tmpreg;
  4689. ref.index:=NR_NO;
  4690. end;
  4691. end
  4692. else
  4693. begin
  4694. tmpreg:=getintregister(list,OS_ADDR);
  4695. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,ref.index));
  4696. ref.base:=tmpreg;
  4697. ref.index:=NR_NO;
  4698. end;
  4699. end;
  4700. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  4701. Result := ref;
  4702. end;
  4703. procedure tthumb2cgarm.a_loadmm_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister; shuffle: pmmshuffle);
  4704. var
  4705. instr: taicpu;
  4706. begin
  4707. if (fromsize=OS_F32) and
  4708. (tosize=OS_F32) then
  4709. begin
  4710. instr:=setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32);
  4711. list.Concat(instr);
  4712. add_move_instruction(instr);
  4713. end
  4714. else if (fromsize=OS_F64) and
  4715. (tosize=OS_F64) then
  4716. begin
  4717. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,tregister(longint(reg2)+1),tregister(longint(reg1)+1)), PF_F32));
  4718. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32));
  4719. end
  4720. else if (fromsize=OS_F32) and
  4721. (tosize=OS_F64) then
  4722. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VCVT,reg2,reg1), PF_F32))
  4723. begin
  4724. //list.concat(nil);
  4725. end;
  4726. end;
  4727. procedure tthumb2cgarm.a_loadmm_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  4728. begin
  4729. handle_load_store(list,A_VLDR,PF_None,reg,ref);
  4730. end;
  4731. procedure tthumb2cgarm.a_loadmm_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  4732. begin
  4733. handle_load_store(list,A_VSTR,PF_None,reg,ref);
  4734. end;
  4735. procedure tthumb2cgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize: tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  4736. begin
  4737. if //(shuffle=nil) and
  4738. (tosize=OS_F32) then
  4739. list.Concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg))
  4740. else
  4741. internalerror(2012100813);
  4742. end;
  4743. procedure tthumb2cgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize: tcgsize; mmreg, intreg: tregister; shuffle: pmmshuffle);
  4744. begin
  4745. if //(shuffle=nil) and
  4746. (fromsize=OS_F32) then
  4747. list.Concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg))
  4748. else
  4749. internalerror(2012100814);
  4750. end;
  4751. procedure tthumb2cg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  4752. var tmpreg: tregister;
  4753. begin
  4754. case op of
  4755. OP_NEG:
  4756. begin
  4757. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4758. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  4759. tmpreg:=cg.getintregister(list,OS_32);
  4760. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,0));
  4761. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,tmpreg,regsrc.reghi));
  4762. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4763. end;
  4764. else
  4765. inherited a_op64_reg_reg(list, op, size, regsrc, regdst);
  4766. end;
  4767. end;
  4768. procedure tthumbcg64farm.a_op64_reg_reg(list: TAsmList; op: TOpCG; size: tcgsize; regsrc, regdst: tregister64);
  4769. begin
  4770. case op of
  4771. OP_NEG:
  4772. begin
  4773. list.concat(taicpu.op_reg_const(A_MOV,regdst.reglo,0));
  4774. list.concat(taicpu.op_reg_const(A_MOV,regdst.reghi,0));
  4775. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4776. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4777. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4778. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4779. end;
  4780. OP_NOT:
  4781. begin
  4782. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  4783. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  4784. end;
  4785. OP_AND,OP_OR,OP_XOR:
  4786. begin
  4787. cg.a_op_reg_reg(list,op,OS_32,regsrc.reglo,regdst.reglo);
  4788. cg.a_op_reg_reg(list,op,OS_32,regsrc.reghi,regdst.reghi);
  4789. end;
  4790. OP_ADD:
  4791. begin
  4792. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4793. list.concat(taicpu.op_reg_reg(A_ADD,regdst.reglo,regsrc.reglo));
  4794. list.concat(taicpu.op_reg_reg(A_ADC,regdst.reghi,regsrc.reghi));
  4795. end;
  4796. OP_SUB:
  4797. begin
  4798. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4799. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4800. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4801. end;
  4802. else
  4803. internalerror(2003083101);
  4804. end;
  4805. end;
  4806. procedure tthumbcg64farm.a_op64_const_reg(list: TAsmList; op: TOpCG; size: tcgsize; value: int64; reg: tregister64);
  4807. var
  4808. tmpreg : tregister;
  4809. begin
  4810. case op of
  4811. OP_AND,OP_OR,OP_XOR:
  4812. begin
  4813. cg.a_op_const_reg(list,op,OS_32,aint(lo(value)),reg.reglo);
  4814. cg.a_op_const_reg(list,op,OS_32,aint(hi(value)),reg.reghi);
  4815. end;
  4816. OP_ADD:
  4817. begin
  4818. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4819. begin
  4820. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4821. list.concat(taicpu.op_reg_const(A_ADD,reg.reglo,aint(lo(value))));
  4822. end
  4823. else
  4824. begin
  4825. tmpreg:=cg.getintregister(list,OS_32);
  4826. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4827. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4828. list.concat(taicpu.op_reg_reg(A_ADD,reg.reglo,tmpreg));
  4829. end;
  4830. tmpreg:=cg.getintregister(list,OS_32);
  4831. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  4832. list.concat(taicpu.op_reg_reg(A_ADC,reg.reghi,tmpreg));
  4833. end;
  4834. OP_SUB:
  4835. begin
  4836. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4837. begin
  4838. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4839. list.concat(taicpu.op_reg_const(A_SUB,reg.reglo,aint(lo(value))))
  4840. end
  4841. else
  4842. begin
  4843. tmpreg:=cg.getintregister(list,OS_32);
  4844. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4845. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4846. list.concat(taicpu.op_reg_reg(A_SUB,reg.reglo,tmpreg));
  4847. end;
  4848. tmpreg:=cg.getintregister(list,OS_32);
  4849. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  4850. list.concat(taicpu.op_reg_reg(A_SBC,reg.reghi,tmpreg));
  4851. end;
  4852. else
  4853. internalerror(2003083101);
  4854. end;
  4855. end;
  4856. procedure create_codegen;
  4857. begin
  4858. if GenerateThumb2Code then
  4859. begin
  4860. cg:=tthumb2cgarm.create;
  4861. cg64:=tthumb2cg64farm.create;
  4862. casmoptimizer:=TCpuThumb2AsmOptimizer;
  4863. end
  4864. else if GenerateThumbCode then
  4865. begin
  4866. cg:=tthumbcgarm.create;
  4867. cg64:=tthumbcg64farm.create;
  4868. // casmoptimizer:=TCpuThumbAsmOptimizer;
  4869. end
  4870. else
  4871. begin
  4872. cg:=tarmcgarm.create;
  4873. cg64:=tarmcg64farm.create;
  4874. casmoptimizer:=TCpuAsmOptimizer;
  4875. end;
  4876. end;
  4877. end.