cgcpu.pas 214 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411241224132414241524162417241824192420242124222423242424252426242724282429243024312432243324342435243624372438243924402441244224432444244524462447244824492450245124522453245424552456245724582459246024612462246324642465246624672468246924702471247224732474247524762477247824792480248124822483248424852486248724882489249024912492249324942495249624972498249925002501250225032504250525062507250825092510251125122513251425152516251725182519252025212522252325242525252625272528252925302531253225332534253525362537253825392540254125422543254425452546254725482549255025512552255325542555255625572558255925602561256225632564256525662567256825692570257125722573257425752576257725782579258025812582258325842585258625872588258925902591259225932594259525962597259825992600260126022603260426052606260726082609261026112612261326142615261626172618261926202621262226232624262526262627262826292630263126322633263426352636263726382639264026412642264326442645264626472648264926502651265226532654265526562657265826592660266126622663266426652666266726682669267026712672267326742675267626772678267926802681268226832684268526862687268826892690269126922693269426952696269726982699270027012702270327042705270627072708270927102711271227132714271527162717271827192720272127222723272427252726272727282729273027312732273327342735273627372738273927402741274227432744274527462747274827492750275127522753275427552756275727582759276027612762276327642765276627672768276927702771277227732774277527762777277827792780278127822783278427852786278727882789279027912792279327942795279627972798279928002801280228032804280528062807280828092810281128122813281428152816281728182819282028212822282328242825282628272828282928302831283228332834283528362837283828392840284128422843284428452846284728482849285028512852285328542855285628572858285928602861286228632864286528662867286828692870287128722873287428752876287728782879288028812882288328842885288628872888288928902891289228932894289528962897289828992900290129022903290429052906290729082909291029112912291329142915291629172918291929202921292229232924292529262927292829292930293129322933293429352936293729382939294029412942294329442945294629472948294929502951295229532954295529562957295829592960296129622963296429652966296729682969297029712972297329742975297629772978297929802981298229832984298529862987298829892990299129922993299429952996299729982999300030013002300330043005300630073008300930103011301230133014301530163017301830193020302130223023302430253026302730283029303030313032303330343035303630373038303930403041304230433044304530463047304830493050305130523053305430553056305730583059306030613062306330643065306630673068306930703071307230733074307530763077307830793080308130823083308430853086308730883089309030913092309330943095309630973098309931003101310231033104310531063107310831093110311131123113311431153116311731183119312031213122312331243125312631273128312931303131313231333134313531363137313831393140314131423143314431453146314731483149315031513152315331543155315631573158315931603161316231633164316531663167316831693170317131723173317431753176317731783179318031813182318331843185318631873188318931903191319231933194319531963197319831993200320132023203320432053206320732083209321032113212321332143215321632173218321932203221322232233224322532263227322832293230323132323233323432353236323732383239324032413242324332443245324632473248324932503251325232533254325532563257325832593260326132623263326432653266326732683269327032713272327332743275327632773278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377737783779378037813782378337843785378637873788378937903791379237933794379537963797379837993800380138023803380438053806380738083809381038113812381338143815381638173818381938203821382238233824382538263827382838293830383138323833383438353836383738383839384038413842384338443845384638473848384938503851385238533854385538563857385838593860386138623863386438653866386738683869387038713872387338743875387638773878387938803881388238833884388538863887388838893890389138923893389438953896389738983899390039013902390339043905390639073908390939103911391239133914391539163917391839193920392139223923392439253926392739283929393039313932393339343935393639373938393939403941394239433944394539463947394839493950395139523953395439553956395739583959396039613962396339643965396639673968396939703971397239733974397539763977397839793980398139823983398439853986398739883989399039913992399339943995399639973998399940004001400240034004400540064007400840094010401140124013401440154016401740184019402040214022402340244025402640274028402940304031403240334034403540364037403840394040404140424043404440454046404740484049405040514052405340544055405640574058405940604061406240634064406540664067406840694070407140724073407440754076407740784079408040814082408340844085408640874088408940904091409240934094409540964097409840994100410141024103410441054106410741084109411041114112411341144115411641174118411941204121412241234124412541264127412841294130413141324133413441354136413741384139414041414142414341444145414641474148414941504151415241534154415541564157415841594160416141624163416441654166416741684169417041714172417341744175417641774178417941804181418241834184418541864187418841894190419141924193419441954196419741984199420042014202420342044205420642074208420942104211421242134214421542164217421842194220422142224223422442254226422742284229423042314232423342344235423642374238423942404241424242434244424542464247424842494250425142524253425442554256425742584259426042614262426342644265426642674268426942704271427242734274427542764277427842794280428142824283428442854286428742884289429042914292429342944295429642974298429943004301430243034304430543064307430843094310431143124313431443154316431743184319432043214322432343244325432643274328432943304331433243334334433543364337433843394340434143424343434443454346434743484349435043514352435343544355435643574358435943604361436243634364436543664367436843694370437143724373437443754376437743784379438043814382438343844385438643874388438943904391439243934394439543964397439843994400440144024403440444054406440744084409441044114412441344144415441644174418441944204421442244234424442544264427442844294430443144324433443444354436443744384439444044414442444344444445444644474448444944504451445244534454445544564457445844594460446144624463446444654466446744684469447044714472447344744475447644774478447944804481448244834484448544864487448844894490449144924493449444954496449744984499450045014502450345044505450645074508450945104511451245134514451545164517451845194520452145224523452445254526452745284529453045314532453345344535453645374538453945404541454245434544454545464547454845494550455145524553455445554556455745584559456045614562456345644565456645674568456945704571457245734574457545764577457845794580458145824583458445854586458745884589459045914592459345944595459645974598459946004601460246034604460546064607460846094610461146124613461446154616461746184619462046214622462346244625462646274628462946304631463246334634463546364637463846394640464146424643464446454646464746484649465046514652465346544655465646574658465946604661466246634664466546664667466846694670467146724673467446754676467746784679468046814682468346844685468646874688468946904691469246934694469546964697469846994700470147024703470447054706470747084709471047114712471347144715471647174718471947204721472247234724472547264727472847294730473147324733473447354736473747384739474047414742474347444745474647474748474947504751475247534754475547564757475847594760476147624763476447654766476747684769477047714772477347744775477647774778477947804781478247834784478547864787478847894790479147924793479447954796479747984799480048014802480348044805480648074808480948104811481248134814481548164817481848194820482148224823482448254826482748284829483048314832483348344835483648374838483948404841484248434844484548464847484848494850485148524853485448554856485748584859486048614862486348644865486648674868486948704871487248734874487548764877487848794880488148824883488448854886488748884889489048914892489348944895489648974898489949004901490249034904490549064907490849094910491149124913491449154916491749184919492049214922492349244925492649274928492949304931493249334934493549364937493849394940494149424943494449454946494749484949495049514952495349544955495649574958495949604961496249634964496549664967496849694970497149724973497449754976497749784979498049814982498349844985498649874988498949904991499249934994499549964997499849995000500150025003500450055006500750085009501050115012501350145015501650175018501950205021502250235024502550265027502850295030503150325033503450355036503750385039504050415042504350445045504650475048504950505051505250535054505550565057505850595060506150625063506450655066506750685069507050715072507350745075507650775078507950805081508250835084508550865087508850895090509150925093509450955096509750985099510051015102510351045105510651075108510951105111511251135114511551165117511851195120512151225123512451255126512751285129513051315132513351345135513651375138513951405141514251435144514551465147514851495150515151525153515451555156515751585159516051615162516351645165516651675168516951705171517251735174517551765177517851795180518151825183518451855186518751885189519051915192519351945195519651975198519952005201520252035204520552065207520852095210521152125213521452155216521752185219522052215222522352245225522652275228522952305231523252335234523552365237523852395240524152425243524452455246524752485249525052515252525352545255525652575258525952605261526252635264526552665267526852695270527152725273527452755276527752785279528052815282528352845285528652875288528952905291529252935294529552965297529852995300530153025303530453055306530753085309531053115312531353145315531653175318531953205321532253235324532553265327
  1. {
  2. Copyright (c) 2003 by Florian Klaempfl
  3. Member of the Free Pascal development team
  4. This unit implements the code generator for the ARM
  5. This program is free software; you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation; either version 2 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program; if not, write to the Free Software
  15. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  16. ****************************************************************************
  17. }
  18. unit cgcpu;
  19. {$i fpcdefs.inc}
  20. interface
  21. uses
  22. globtype,symtype,symdef,
  23. cgbase,cgutils,cgobj,
  24. aasmbase,aasmcpu,aasmtai,aasmdata,
  25. parabase,
  26. cpubase,cpuinfo,cg64f32,rgcpu;
  27. type
  28. { tbasecgarm is shared between all arm architectures }
  29. tbasecgarm = class(tcg)
  30. { true, if the next arithmetic operation should modify the flags }
  31. cgsetflags : boolean;
  32. procedure a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);override;
  33. protected
  34. procedure a_load_ref_cgparalocref(list: TAsmList; sourcesize: tcgsize; sizeleft: tcgint; const ref, paralocref: treference; const cgpara: tcgpara; const location: PCGParaLocation); override;
  35. public
  36. procedure a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);override;
  37. procedure a_call_name(list : TAsmList;const s : string; weak: boolean);override;
  38. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  39. { move instructions }
  40. procedure a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);override;
  41. procedure a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);override;
  42. function a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  43. function a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  44. { fpu move instructions }
  45. procedure a_loadfpu_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister); override;
  46. procedure a_loadfpu_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister); override;
  47. procedure a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference); override;
  48. procedure a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);override;
  49. { comparison operations }
  50. procedure a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  51. l : tasmlabel);override;
  52. procedure a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel); override;
  53. procedure a_jmp_name(list : TAsmList;const s : string); override;
  54. procedure a_jmp_always(list : TAsmList;l: tasmlabel); override;
  55. procedure a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel); override;
  56. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  57. procedure g_profilecode(list : TAsmList); override;
  58. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  59. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  60. procedure g_maybe_got_init(list : TAsmList); override;
  61. procedure a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);override;
  62. procedure g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);override;
  63. procedure g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);override;
  64. procedure g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  65. procedure g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  66. procedure g_overflowcheck(list: TAsmList; const l: tlocation; def: tdef); override;
  67. procedure g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);override;
  68. procedure g_save_registers(list : TAsmList);override;
  69. procedure g_restore_registers(list : TAsmList);override;
  70. procedure a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  71. procedure fixref(list : TAsmList;var ref : treference);
  72. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; virtual;
  73. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  74. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  75. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  76. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  77. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  78. procedure a_opmm_reg_reg(list: TAsmList; Op: TOpCG; size : tcgsize;src,dst: tregister;shuffle : pmmshuffle); override;
  79. { Transform unsupported methods into Internal errors }
  80. procedure a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister); override;
  81. { try to generate optimized 32 Bit multiplication, returns true if successful generated }
  82. function try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  83. { clear out potential overflow bits from 8 or 16 bit operations
  84. the upper 24/16 bits of a register after an operation }
  85. procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  86. { mla for thumb requires that none of the registers is equal to r13/r15, this method ensures this }
  87. procedure safe_mla(list: TAsmList;op1,op2,op3,op4 : TRegister);
  88. procedure g_maybe_tls_init(list : TAsmList); override;
  89. end;
  90. { tcgarm is shared between normal arm and thumb-2 }
  91. tcgarm = class(tbasecgarm)
  92. procedure a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister); override;
  93. procedure a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference); override;
  94. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  95. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  96. size: tcgsize; a: tcgint; src, dst: tregister); override;
  97. procedure a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  98. size: tcgsize; src1, src2, dst: tregister); override;
  99. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  100. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  101. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  102. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  103. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  104. {Multiply two 32-bit registers into lo and hi 32-bit registers}
  105. procedure a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister); override;
  106. end;
  107. { normal arm cg }
  108. tarmcgarm = class(tcgarm)
  109. procedure init_register_allocators;override;
  110. procedure done_register_allocators;override;
  111. end;
  112. { 64 bit cg for all arm flavours }
  113. tbasecg64farm = class(tcg64f32)
  114. end;
  115. { tcg64farm is shared between normal arm and thumb-2 }
  116. tcg64farm = class(tbasecg64farm)
  117. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  118. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  119. procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;
  120. procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
  121. procedure a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  122. procedure a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  123. procedure a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);override;
  124. procedure a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);override;
  125. end;
  126. tarmcg64farm = class(tcg64farm)
  127. end;
  128. tthumbcgarm = class(tbasecgarm)
  129. procedure init_register_allocators;override;
  130. procedure done_register_allocators;override;
  131. procedure g_proc_entry(list: TAsmList; localsize: longint; nostackframe: boolean);override;
  132. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  133. procedure a_op_reg_reg(list: TAsmList; Op: TOpCG; size: TCGSize; src,dst: TRegister);override;
  134. procedure a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);override;
  135. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister); override;
  136. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  137. procedure a_load_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const Ref: treference; reg: tregister);override;
  138. procedure a_load_const_reg(list: TAsmList; size: tcgsize; a: tcgint; reg: tregister);override;
  139. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  140. function handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference; override;
  141. end;
  142. tthumbcg64farm = class(tbasecg64farm)
  143. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  144. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  145. end;
  146. tthumb2cgarm = class(tcgarm)
  147. procedure init_register_allocators;override;
  148. procedure done_register_allocators;override;
  149. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  150. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  151. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  152. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  153. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  154. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  155. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  156. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  157. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  158. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; override;
  159. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  160. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  161. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  162. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  163. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  164. end;
  165. tthumb2cg64farm = class(tcg64farm)
  166. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  167. end;
  168. const
  169. OpCmp2AsmCond : Array[topcmp] of TAsmCond = (C_NONE,C_EQ,C_GT,
  170. C_LT,C_GE,C_LE,C_NE,C_LS,C_CC,C_CS,C_HI);
  171. winstackpagesize = 4096;
  172. function get_fpu_postfix(def : tdef) : toppostfix;
  173. procedure create_codegen;
  174. implementation
  175. uses
  176. globals,verbose,systems,cutils,
  177. aopt,aoptcpu,
  178. fmodule,
  179. symconst,symsym,symtable,
  180. tgobj,
  181. procinfo,cpupi,
  182. paramgr;
  183. { Range check must be disabled explicitly as conversions between signed and unsigned
  184. 32-bit values are done without explicit typecasts }
  185. {$R-}
  186. function get_fpu_postfix(def : tdef) : toppostfix;
  187. begin
  188. if def.typ=floatdef then
  189. begin
  190. case tfloatdef(def).floattype of
  191. s32real:
  192. result:=PF_S;
  193. s64real:
  194. result:=PF_D;
  195. s80real:
  196. result:=PF_E;
  197. else
  198. internalerror(200401272);
  199. end;
  200. end
  201. else
  202. internalerror(200401271);
  203. end;
  204. procedure tarmcgarm.init_register_allocators;
  205. begin
  206. inherited init_register_allocators;
  207. { currently, we always save R14, so we can use it }
  208. if (target_info.system<>system_arm_darwin) then
  209. begin
  210. if assigned(current_procinfo) and (current_procinfo.framepointer<>NR_R11) then
  211. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  212. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  213. RS_R9,RS_R10,RS_R11,RS_R14],first_int_imreg,[])
  214. else
  215. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  216. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  217. RS_R9,RS_R10,RS_R14],first_int_imreg,[])
  218. end
  219. else
  220. { r7 is not available on Darwin, it's used as frame pointer (always,
  221. for backtrace support -- also in gcc/clang -> R11 can be used).
  222. r9 is volatile }
  223. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  224. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R9,RS_R12,RS_R4,RS_R5,RS_R6,RS_R8,
  225. RS_R10,RS_R11,RS_R14],first_int_imreg,[]);
  226. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  227. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  228. { The register allocator currently cannot deal with multiple
  229. non-overlapping subregs per register, so we can only use
  230. half the single precision registers for now (as sub registers of the
  231. double precision ones). }
  232. if current_settings.fputype in [fpu_vfpv3,fpu_vfpv4] then
  233. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  234. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  235. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  236. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  237. ],first_mm_imreg,[])
  238. else
  239. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  240. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15],first_mm_imreg,[]);
  241. end;
  242. procedure tarmcgarm.done_register_allocators;
  243. begin
  244. rg[R_INTREGISTER].free;
  245. rg[R_FPUREGISTER].free;
  246. rg[R_MMREGISTER].free;
  247. inherited done_register_allocators;
  248. end;
  249. procedure tcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  250. var
  251. imm_shift : byte;
  252. l : tasmlabel;
  253. hr : treference;
  254. imm1, imm2: DWord;
  255. begin
  256. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  257. internalerror(2002090902);
  258. if is_shifter_const(a,imm_shift) then
  259. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  260. else if is_shifter_const(not(a),imm_shift) then
  261. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  262. { loading of constants with mov and orr }
  263. else if (split_into_shifter_const(a,imm1, imm2)) then
  264. begin
  265. list.concat(taicpu.op_reg_const(A_MOV,reg, imm1));
  266. list.concat(taicpu.op_reg_reg_const(A_ORR,reg,reg, imm2));
  267. end
  268. { loading of constants with mvn and bic }
  269. else if (split_into_shifter_const(not(a), imm1, imm2)) then
  270. begin
  271. list.concat(taicpu.op_reg_const(A_MVN,reg, imm1));
  272. list.concat(taicpu.op_reg_reg_const(A_BIC,reg,reg, imm2));
  273. end
  274. else
  275. begin
  276. reference_reset(hr,4,[]);
  277. current_asmdata.getjumplabel(l);
  278. cg.a_label(current_procinfo.aktlocaldata,l);
  279. hr.symboldata:=current_procinfo.aktlocaldata.last;
  280. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  281. hr.symbol:=l;
  282. hr.base:=NR_PC;
  283. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  284. end;
  285. end;
  286. procedure tcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  287. var
  288. oppostfix:toppostfix;
  289. usedtmpref: treference;
  290. tmpreg,tmpreg2 : tregister;
  291. so : tshifterop;
  292. dir : integer;
  293. begin
  294. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  295. FromSize := ToSize;
  296. case FromSize of
  297. { signed integer registers }
  298. OS_8:
  299. oppostfix:=PF_B;
  300. OS_S8:
  301. oppostfix:=PF_SB;
  302. OS_16:
  303. oppostfix:=PF_H;
  304. OS_S16:
  305. oppostfix:=PF_SH;
  306. OS_32,
  307. OS_S32:
  308. oppostfix:=PF_None;
  309. else
  310. InternalError(200308297);
  311. end;
  312. if (fromsize=OS_S8) and
  313. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  314. oppostfix:=PF_B;
  315. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize])) or
  316. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  317. (oppostfix in [PF_SH,PF_H])) then
  318. begin
  319. if target_info.endian=endian_big then
  320. dir:=-1
  321. else
  322. dir:=1;
  323. case FromSize of
  324. OS_16,OS_S16:
  325. begin
  326. { only complicated references need an extra loadaddr }
  327. if assigned(ref.symbol) or
  328. (ref.index<>NR_NO) or
  329. (ref.offset<-4095) or
  330. (ref.offset>4094) or
  331. { sometimes the compiler reused registers }
  332. (reg=ref.index) or
  333. (reg=ref.base) then
  334. begin
  335. tmpreg2:=getintregister(list,OS_INT);
  336. a_loadaddr_ref_reg(list,ref,tmpreg2);
  337. reference_reset_base(usedtmpref,tmpreg2,0,ref.temppos,ref.alignment,ref.volatility);
  338. end
  339. else
  340. usedtmpref:=ref;
  341. if target_info.endian=endian_big then
  342. inc(usedtmpref.offset,1);
  343. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  344. tmpreg:=getintregister(list,OS_INT);
  345. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  346. inc(usedtmpref.offset,dir);
  347. if FromSize=OS_16 then
  348. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  349. else
  350. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  351. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  352. end;
  353. OS_32,OS_S32:
  354. begin
  355. tmpreg:=getintregister(list,OS_INT);
  356. { only complicated references need an extra loadaddr }
  357. if assigned(ref.symbol) or
  358. (ref.index<>NR_NO) or
  359. (ref.offset<-4095) or
  360. (ref.offset>4092) or
  361. { sometimes the compiler reused registers }
  362. (reg=ref.index) or
  363. (reg=ref.base) then
  364. begin
  365. tmpreg2:=getintregister(list,OS_INT);
  366. a_loadaddr_ref_reg(list,ref,tmpreg2);
  367. reference_reset_base(usedtmpref,tmpreg2,0,ref.temppos,ref.alignment,ref.volatility);
  368. end
  369. else
  370. usedtmpref:=ref;
  371. shifterop_reset(so);so.shiftmode:=SM_LSL;
  372. if ref.alignment=2 then
  373. begin
  374. if target_info.endian=endian_big then
  375. inc(usedtmpref.offset,2);
  376. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  377. inc(usedtmpref.offset,dir*2);
  378. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  379. so.shiftimm:=16;
  380. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  381. end
  382. else
  383. begin
  384. tmpreg2:=getintregister(list,OS_INT);
  385. if target_info.endian=endian_big then
  386. inc(usedtmpref.offset,3);
  387. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  388. inc(usedtmpref.offset,dir);
  389. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  390. inc(usedtmpref.offset,dir);
  391. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg2);
  392. so.shiftimm:=8;
  393. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  394. inc(usedtmpref.offset,dir);
  395. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  396. so.shiftimm:=16;
  397. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg2,so));
  398. so.shiftimm:=24;
  399. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  400. end;
  401. end
  402. else
  403. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  404. end;
  405. end
  406. else
  407. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  408. if (fromsize=OS_S8) and
  409. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  410. a_load_reg_reg(list,OS_S8,OS_32,reg,reg)
  411. else if (fromsize=OS_S8) and (tosize = OS_16) then
  412. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  413. end;
  414. procedure tcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  415. var
  416. hsym : tsym;
  417. href : treference;
  418. paraloc : Pcgparalocation;
  419. shift : byte;
  420. begin
  421. { calculate the parameter info for the procdef }
  422. procdef.init_paraloc_info(callerside);
  423. hsym:=tsym(procdef.parast.Find('self'));
  424. if not(assigned(hsym) and
  425. (hsym.typ=paravarsym)) then
  426. internalerror(200305251);
  427. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  428. while paraloc<>nil do
  429. with paraloc^ do
  430. begin
  431. case loc of
  432. LOC_REGISTER:
  433. begin
  434. if is_shifter_const(ioffset,shift) then
  435. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  436. else
  437. begin
  438. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  439. a_op_reg_reg(list,OP_SUB,size,NR_R12,register);
  440. end;
  441. end;
  442. LOC_REFERENCE:
  443. begin
  444. { offset in the wrapper needs to be adjusted for the stored
  445. return address }
  446. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),ctempposinvalid,sizeof(pint),[]);
  447. if is_shifter_const(ioffset,shift) then
  448. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  449. else
  450. begin
  451. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  452. a_op_reg_ref(list,OP_SUB,size,NR_R12,href);
  453. end;
  454. end
  455. else
  456. internalerror(200309189);
  457. end;
  458. paraloc:=next;
  459. end;
  460. end;
  461. procedure tbasecgarm.a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);
  462. var
  463. ref: treference;
  464. begin
  465. paraloc.check_simple_location;
  466. paramanager.allocparaloc(list,paraloc.location);
  467. case paraloc.location^.loc of
  468. LOC_REGISTER,LOC_CREGISTER:
  469. a_load_const_reg(list,size,a,paraloc.location^.register);
  470. LOC_REFERENCE:
  471. begin
  472. reference_reset(ref,paraloc.alignment,[]);
  473. ref.base:=paraloc.location^.reference.index;
  474. ref.offset:=paraloc.location^.reference.offset;
  475. a_load_const_ref(list,size,a,ref);
  476. end;
  477. else
  478. internalerror(2002081101);
  479. end;
  480. end;
  481. procedure tbasecgarm.a_load_ref_cgparalocref(list: TAsmList; sourcesize: tcgsize; sizeleft: tcgint; const ref, paralocref: treference; const cgpara: tcgpara; const location: PCGParaLocation);
  482. begin
  483. { doubles in softemu mode have a strange order of registers and references }
  484. if (cgpara.size=OS_F64) and
  485. (location^.size=OS_32) then
  486. begin
  487. g_concatcopy(list,ref,paralocref,4)
  488. end
  489. else
  490. inherited;
  491. end;
  492. procedure tbasecgarm.a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);
  493. var
  494. ref: treference;
  495. tmpreg: tregister;
  496. begin
  497. paraloc.check_simple_location;
  498. paramanager.allocparaloc(list,paraloc.location);
  499. case paraloc.location^.loc of
  500. LOC_REGISTER,LOC_CREGISTER:
  501. a_loadaddr_ref_reg(list,r,paraloc.location^.register);
  502. LOC_REFERENCE:
  503. begin
  504. reference_reset(ref,paraloc.alignment,[]);
  505. ref.base := paraloc.location^.reference.index;
  506. ref.offset := paraloc.location^.reference.offset;
  507. tmpreg := getintregister(list,OS_ADDR);
  508. a_loadaddr_ref_reg(list,r,tmpreg);
  509. a_load_reg_ref(list,OS_ADDR,OS_ADDR,tmpreg,ref);
  510. end;
  511. else
  512. internalerror(2002080701);
  513. end;
  514. end;
  515. procedure tbasecgarm.a_call_name(list : TAsmList;const s : string; weak: boolean);
  516. var
  517. branchopcode: tasmop;
  518. r : treference;
  519. sym : TAsmSymbol;
  520. begin
  521. { use always BL as newer binutils do not translate blx apparently
  522. generating BL is also what clang and gcc do by default }
  523. branchopcode:=A_BL;
  524. if not(weak) then
  525. sym:=current_asmdata.RefAsmSymbol(s,AT_FUNCTION)
  526. else
  527. sym:=current_asmdata.WeakRefAsmSymbol(s,AT_FUNCTION);
  528. reference_reset_symbol(r,sym,0,sizeof(pint),[]);
  529. if (tf_pic_uses_got in target_info.flags) and
  530. (cs_create_pic in current_settings.moduleswitches) then
  531. begin
  532. r.refaddr:=addr_pic
  533. end
  534. else
  535. r.refaddr:=addr_full;
  536. list.concat(taicpu.op_ref(branchopcode,r));
  537. {
  538. the compiler does not properly set this flag anymore in pass 1, and
  539. for now we only need it after pass 2 (I hope) (JM)
  540. if not(pi_do_call in current_procinfo.flags) then
  541. internalerror(2003060703);
  542. }
  543. include(current_procinfo.flags,pi_do_call);
  544. end;
  545. procedure tbasecgarm.a_call_reg(list : TAsmList;reg: tregister);
  546. begin
  547. { check not really correct: should only be used for non-Thumb cpus }
  548. if not(CPUARM_HAS_BLX in cpu_capabilities[current_settings.cputype]) then
  549. begin
  550. list.concat(taicpu.op_reg_reg(A_MOV,NR_R14,NR_PC));
  551. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,reg));
  552. end
  553. else
  554. list.concat(taicpu.op_reg(A_BLX, reg));
  555. {
  556. the compiler does not properly set this flag anymore in pass 1, and
  557. for now we only need it after pass 2 (I hope) (JM)
  558. if not(pi_do_call in current_procinfo.flags) then
  559. internalerror(2003060703);
  560. }
  561. include(current_procinfo.flags,pi_do_call);
  562. end;
  563. procedure tcgarm.a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister);
  564. begin
  565. a_op_const_reg_reg(list,op,size,a,reg,reg);
  566. end;
  567. procedure tcgarm.a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference);
  568. var
  569. tmpreg,tmpresreg : tregister;
  570. tmpref : treference;
  571. begin
  572. tmpreg:=getintregister(list,size);
  573. tmpresreg:=getintregister(list,size);
  574. tmpref:=a_internal_load_ref_reg(list,size,size,ref,tmpreg);
  575. a_op_const_reg_reg(list,op,size,a,tmpreg,tmpresreg);
  576. a_load_reg_ref(list,size,size,tmpresreg,tmpref);
  577. end;
  578. procedure tcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  579. var
  580. so : tshifterop;
  581. begin
  582. if op = OP_NEG then
  583. begin
  584. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,src,0));
  585. maybeadjustresult(list,OP_NEG,size,dst);
  586. end
  587. else if op = OP_NOT then
  588. begin
  589. if size in [OS_8, OS_16, OS_S8, OS_S16] then
  590. begin
  591. shifterop_reset(so);
  592. so.shiftmode:=SM_LSL;
  593. if size in [OS_8, OS_S8] then
  594. so.shiftimm:=24
  595. else
  596. so.shiftimm:=16;
  597. list.concat(taicpu.op_reg_reg_shifterop(A_MVN,dst,src,so));
  598. {Using a shift here allows this to be folded into another instruction}
  599. if size in [OS_S8, OS_S16] then
  600. so.shiftmode:=SM_ASR
  601. else
  602. so.shiftmode:=SM_LSR;
  603. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  604. end
  605. else
  606. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  607. end
  608. else
  609. a_op_reg_reg_reg(list,op,size,src,dst,dst);
  610. end;
  611. const
  612. op_reg_reg_opcg2asmop: array[TOpCG] of tasmop =
  613. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  614. A_NONE,A_NONE,A_NONE,A_SUB,A_EOR,A_NONE,A_NONE);
  615. op_reg_opcg2asmop: array[TOpCG] of tasmop =
  616. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  617. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  618. op_reg_postfix: array[TOpCG] of TOpPostfix =
  619. (PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,
  620. PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None);
  621. procedure tcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  622. size: tcgsize; a: tcgint; src, dst: tregister);
  623. var
  624. ovloc : tlocation;
  625. begin
  626. a_op_const_reg_reg_checkoverflow(list,op,size,a,src,dst,false,ovloc);
  627. end;
  628. procedure tcgarm.a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  629. size: tcgsize; src1, src2, dst: tregister);
  630. var
  631. ovloc : tlocation;
  632. begin
  633. a_op_reg_reg_reg_checkoverflow(list,op,size,src1,src2,dst,false,ovloc);
  634. end;
  635. function opshift2shiftmode(op: TOpCg): tshiftmode;
  636. begin
  637. case op of
  638. OP_SHL: Result:=SM_LSL;
  639. OP_SHR: Result:=SM_LSR;
  640. OP_ROR: Result:=SM_ROR;
  641. OP_ROL: Result:=SM_ROR;
  642. OP_SAR: Result:=SM_ASR;
  643. else internalerror(2012070501);
  644. end
  645. end;
  646. function tbasecgarm.try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  647. var
  648. multiplier : dword;
  649. power : longint;
  650. shifterop : tshifterop;
  651. bitsset : byte;
  652. negative : boolean;
  653. first : boolean;
  654. b,
  655. cycles : byte;
  656. maxeffort : byte;
  657. begin
  658. result:=true;
  659. cycles:=0;
  660. negative:=a<0;
  661. shifterop.rs:=NR_NO;
  662. shifterop.shiftmode:=SM_LSL;
  663. if negative then
  664. inc(cycles);
  665. multiplier:=dword(abs(a));
  666. bitsset:=popcnt(multiplier and $fffffffe);
  667. { heuristics to estimate how much instructions are reasonable to replace the mul,
  668. this is currently based on XScale timings }
  669. { in the simplest case, we need a mov to load the constant and a mul to carry out the
  670. actual multiplication, this requires min. 1+4 cycles
  671. because the first shift imm. might cause a stall and because we need more instructions
  672. when replacing the mul we generate max. 3 instructions to replace this mul }
  673. maxeffort:=3;
  674. { if the constant is not a shifter op, we need either some mov/mvn/bic/or sequence or
  675. a ldr, so generating one more operation to replace this is beneficial }
  676. if not(is_shifter_const(dword(a),b)) and not(is_shifter_const(not(dword(a)),b)) then
  677. inc(maxeffort);
  678. { if the upper 5 bits are all set or clear, mul is one cycle faster }
  679. if ((dword(a) and $f8000000)=0) or ((dword(a) and $f8000000)=$f8000000) then
  680. dec(maxeffort);
  681. { if the upper 17 bits are all set or clear, mul is another cycle faster }
  682. if ((dword(a) and $ffff8000)=0) or ((dword(a) and $ffff8000)=$ffff8000) then
  683. dec(maxeffort);
  684. { most simple cases }
  685. if a=1 then
  686. a_load_reg_reg(list,OS_32,OS_32,src,dst)
  687. else if a=0 then
  688. a_load_const_reg(list,OS_32,0,dst)
  689. else if a=-1 then
  690. a_op_reg_reg(list,OP_NEG,OS_32,src,dst)
  691. { add up ?
  692. basically, one add is needed for each bit being set in the constant factor
  693. however, the least significant bit is for free, it can be hidden in the initial
  694. instruction
  695. }
  696. else if (bitsset+cycles<=maxeffort) and
  697. (bitsset<=popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)) then
  698. begin
  699. first:=true;
  700. while multiplier<>0 do
  701. begin
  702. shifterop.shiftimm:=BsrDWord(multiplier);
  703. if odd(multiplier) then
  704. begin
  705. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,shifterop));
  706. dec(multiplier);
  707. end
  708. else
  709. if first then
  710. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  711. else
  712. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,src,shifterop));
  713. first:=false;
  714. dec(multiplier,1 shl shifterop.shiftimm);
  715. end;
  716. if negative then
  717. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  718. end
  719. { subtract from the next greater power of two? }
  720. else if popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)+cycles+1<=maxeffort then
  721. begin
  722. first:=true;
  723. while multiplier<>0 do
  724. begin
  725. if first then
  726. begin
  727. multiplier:=(1 shl power)-multiplier;
  728. shifterop.shiftimm:=power;
  729. end
  730. else
  731. shifterop.shiftimm:=BsrDWord(multiplier);
  732. if odd(multiplier) then
  733. begin
  734. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,shifterop));
  735. dec(multiplier);
  736. end
  737. else
  738. if first then
  739. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  740. else
  741. begin
  742. list.concat(taicpu.op_reg_reg_reg_shifterop(A_SUB,dst,dst,src,shifterop));
  743. dec(multiplier,1 shl shifterop.shiftimm);
  744. end;
  745. first:=false;
  746. end;
  747. if negative then
  748. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  749. end
  750. else
  751. result:=false;
  752. end;
  753. procedure tcgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  754. var
  755. shift, lsb, width : byte;
  756. tmpreg : tregister;
  757. so : tshifterop;
  758. l1 : longint;
  759. imm1, imm2: DWord;
  760. begin
  761. optimize_op_const(size, op, a);
  762. case op of
  763. OP_NONE:
  764. begin
  765. if src <> dst then
  766. a_load_reg_reg(list, size, size, src, dst);
  767. exit;
  768. end;
  769. OP_MOVE:
  770. begin
  771. a_load_const_reg(list, size, a, dst);
  772. exit;
  773. end;
  774. end;
  775. ovloc.loc:=LOC_VOID;
  776. if {$ifopt R+}(a<>-2147483648) and{$endif} not setflags and is_shifter_const(-a,shift) then
  777. case op of
  778. OP_ADD:
  779. begin
  780. op:=OP_SUB;
  781. a:=aint(dword(-a));
  782. end;
  783. OP_SUB:
  784. begin
  785. op:=OP_ADD;
  786. a:=aint(dword(-a));
  787. end
  788. end;
  789. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  790. case op of
  791. OP_NEG,OP_NOT:
  792. internalerror(200308281);
  793. OP_SHL,
  794. OP_SHR,
  795. OP_ROL,
  796. OP_ROR,
  797. OP_SAR:
  798. begin
  799. if a>32 then
  800. internalerror(200308294);
  801. shifterop_reset(so);
  802. so.shiftmode:=opshift2shiftmode(op);
  803. if op = OP_ROL then
  804. so.shiftimm:=32-a
  805. else
  806. so.shiftimm:=a;
  807. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  808. end;
  809. else
  810. {if (op in [OP_SUB, OP_ADD]) and
  811. ((a < 0) or
  812. (a > 4095)) then
  813. begin
  814. tmpreg:=getintregister(list,size);
  815. list.concat(taicpu.op_reg_const(A_MOVT, tmpreg, (a shr 16) and $FFFF));
  816. list.concat(taicpu.op_reg_const(A_MOV, tmpreg, a and $FFFF));
  817. list.concat(setoppostfix(taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))
  818. ));
  819. end
  820. else}
  821. begin
  822. if cgsetflags or setflags then
  823. a_reg_alloc(list,NR_DEFAULTFLAGS);
  824. list.concat(setoppostfix(
  825. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  826. end;
  827. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  828. begin
  829. ovloc.loc:=LOC_FLAGS;
  830. case op of
  831. OP_ADD:
  832. ovloc.resflags:=F_CS;
  833. OP_SUB:
  834. ovloc.resflags:=F_CC;
  835. end;
  836. end;
  837. end
  838. else
  839. begin
  840. { there could be added some more sophisticated optimizations }
  841. if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  842. a_op_reg_reg(list,OP_NEG,size,src,dst)
  843. { we do this here instead in the peephole optimizer because
  844. it saves us a register }
  845. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  846. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  847. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  848. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  849. begin
  850. if l1>32 then{roozbeh does this ever happen?}
  851. internalerror(200308296);
  852. shifterop_reset(so);
  853. so.shiftmode:=SM_LSL;
  854. so.shiftimm:=l1;
  855. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  856. end
  857. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  858. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  859. begin
  860. if l1>32 then{does this ever happen?}
  861. internalerror(201205181);
  862. shifterop_reset(so);
  863. so.shiftmode:=SM_LSL;
  864. so.shiftimm:=l1;
  865. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  866. end
  867. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  868. begin
  869. { nothing to do on success }
  870. end
  871. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  872. broader range of shifterconstants.}
  873. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  874. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  875. { Doing two shifts instead of two bics might allow the peephole optimizer to fold the second shift
  876. into the following instruction}
  877. else if (op = OP_AND) and
  878. is_continuous_mask(aword(a), lsb, width) and
  879. ((lsb = 0) or ((lsb + width) = 32)) then
  880. begin
  881. shifterop_reset(so);
  882. if (width = 16) and
  883. (lsb = 0) and
  884. (current_settings.cputype >= cpu_armv6) then
  885. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  886. else if (width = 8) and
  887. (lsb = 0) and
  888. (current_settings.cputype >= cpu_armv6) then
  889. list.concat(taicpu.op_reg_reg(A_UXTB,dst,src))
  890. else if lsb = 0 then
  891. begin
  892. so.shiftmode:=SM_LSL;
  893. so.shiftimm:=32-width;
  894. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  895. so.shiftmode:=SM_LSR;
  896. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  897. end
  898. else
  899. begin
  900. so.shiftmode:=SM_LSR;
  901. so.shiftimm:=lsb;
  902. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  903. so.shiftmode:=SM_LSL;
  904. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  905. end;
  906. end
  907. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  908. begin
  909. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,imm1));
  910. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  911. end
  912. else if (op in [OP_ADD, OP_SUB, OP_OR, OP_XOR]) and
  913. not(cgsetflags or setflags) and
  914. split_into_shifter_const(a, imm1, imm2) then
  915. begin
  916. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,imm1));
  917. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  918. end
  919. else
  920. begin
  921. tmpreg:=getintregister(list,size);
  922. a_load_const_reg(list,size,a,tmpreg);
  923. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  924. end;
  925. end;
  926. maybeadjustresult(list,op,size,dst);
  927. end;
  928. procedure tcgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  929. var
  930. so : tshifterop;
  931. tmpreg,overflowreg : tregister;
  932. asmop : tasmop;
  933. begin
  934. ovloc.loc:=LOC_VOID;
  935. case op of
  936. OP_NEG,OP_NOT,
  937. OP_DIV,OP_IDIV:
  938. internalerror(200308283);
  939. OP_SHL,
  940. OP_SHR,
  941. OP_SAR,
  942. OP_ROR:
  943. begin
  944. if (op = OP_ROR) and not(size in [OS_32,OS_S32]) then
  945. internalerror(2008072801);
  946. shifterop_reset(so);
  947. so.rs:=src1;
  948. so.shiftmode:=opshift2shiftmode(op);
  949. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  950. end;
  951. OP_ROL:
  952. begin
  953. if not(size in [OS_32,OS_S32]) then
  954. internalerror(2008072801);
  955. { simulate ROL by ror'ing 32-value }
  956. tmpreg:=getintregister(list,OS_32);
  957. list.concat(taicpu.op_reg_reg_const(A_RSB,tmpreg,src1, 32));
  958. shifterop_reset(so);
  959. so.rs:=tmpreg;
  960. so.shiftmode:=SM_ROR;
  961. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  962. end;
  963. OP_IMUL,
  964. OP_MUL:
  965. begin
  966. if (cgsetflags or setflags) and
  967. (CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype]) then
  968. begin
  969. overflowreg:=getintregister(list,size);
  970. if op=OP_IMUL then
  971. asmop:=A_SMULL
  972. else
  973. asmop:=A_UMULL;
  974. { the arm doesn't allow that rd and rm are the same }
  975. if dst=src2 then
  976. begin
  977. if dst<>src1 then
  978. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  979. else
  980. begin
  981. tmpreg:=getintregister(list,size);
  982. a_load_reg_reg(list,size,size,src2,dst);
  983. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  984. end;
  985. end
  986. else
  987. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  988. a_reg_alloc(list,NR_DEFAULTFLAGS);
  989. if op=OP_IMUL then
  990. begin
  991. shifterop_reset(so);
  992. so.shiftmode:=SM_ASR;
  993. so.shiftimm:=31;
  994. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  995. end
  996. else
  997. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  998. ovloc.loc:=LOC_FLAGS;
  999. ovloc.resflags:=F_NE;
  1000. end
  1001. else
  1002. begin
  1003. { the arm doesn't allow that rd and rm are the same }
  1004. if dst=src2 then
  1005. begin
  1006. if dst<>src1 then
  1007. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  1008. else
  1009. begin
  1010. tmpreg:=getintregister(list,size);
  1011. a_load_reg_reg(list,size,size,src2,dst);
  1012. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  1013. end;
  1014. end
  1015. else
  1016. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  1017. end;
  1018. end;
  1019. else
  1020. begin
  1021. if cgsetflags or setflags then
  1022. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1023. list.concat(setoppostfix(
  1024. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  1025. end;
  1026. end;
  1027. maybeadjustresult(list,op,size,dst);
  1028. end;
  1029. procedure tcgarm.a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister);
  1030. var
  1031. asmop: tasmop;
  1032. begin
  1033. if CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype] then
  1034. begin
  1035. list.concat(tai_comment.create(strpnew('tcgarm.a_mul_reg_reg_pair called')));
  1036. case size of
  1037. OS_32: asmop:=A_UMULL;
  1038. OS_S32: asmop:=A_SMULL;
  1039. else
  1040. InternalError(2014060802);
  1041. end;
  1042. { The caller might omit dstlo or dsthi, when he is not interested in it, we still
  1043. need valid registers everywhere. In case of dsthi = NR_NO we could fall back to
  1044. 32x32=32 bit multiplication}
  1045. if (dstlo = NR_NO) then
  1046. dstlo:=getintregister(list,size);
  1047. if (dsthi = NR_NO) then
  1048. dsthi:=getintregister(list,size);
  1049. list.concat(taicpu.op_reg_reg_reg_reg(asmop, dstlo, dsthi, src1,src2));
  1050. end
  1051. else if dsthi=NR_NO then
  1052. begin
  1053. if (dstlo = NR_NO) then
  1054. dstlo:=getintregister(list,size);
  1055. list.concat(taicpu.op_reg_reg_reg(A_MUL, dstlo, src1,src2));
  1056. end
  1057. else
  1058. begin
  1059. internalerror(2015083022);
  1060. end;
  1061. end;
  1062. function tbasecgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  1063. var
  1064. tmpreg1,tmpreg2 : tregister;
  1065. begin
  1066. tmpreg1:=NR_NO;
  1067. { Be sure to have a base register }
  1068. if (ref.base=NR_NO) then
  1069. begin
  1070. if ref.shiftmode<>SM_None then
  1071. internalerror(2014020701);
  1072. ref.base:=ref.index;
  1073. ref.index:=NR_NO;
  1074. end;
  1075. { absolute symbols can't be handled directly, we've to store the symbol reference
  1076. in the text segment and access it pc relative
  1077. For now, we assume that references where base or index equals to PC are already
  1078. relative, all other references are assumed to be absolute and thus they need
  1079. to be handled extra.
  1080. A proper solution would be to change refoptions to a set and store the information
  1081. if the symbol is absolute or relative there.
  1082. }
  1083. if (assigned(ref.symbol) and
  1084. not(is_pc(ref.base)) and
  1085. not(is_pc(ref.index))
  1086. ) or
  1087. { [#xxx] isn't a valid address operand }
  1088. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  1089. (ref.offset<-4095) or
  1090. (ref.offset>4095) or
  1091. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  1092. ((ref.offset<-255) or
  1093. (ref.offset>255)
  1094. )
  1095. ) or
  1096. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1097. ((ref.offset<-1020) or
  1098. (ref.offset>1020) or
  1099. ((abs(ref.offset) mod 4)<>0)
  1100. )
  1101. ) or
  1102. ((GenerateThumbCode) and
  1103. (((oppostfix in [PF_SB,PF_SH]) and (ref.offset<>0)) or
  1104. ((oppostfix=PF_None) and ((ref.offset<0) or ((ref.base<>NR_STACK_POINTER_REG) and (ref.offset>124)) or
  1105. ((ref.base=NR_STACK_POINTER_REG) and (ref.offset>1020)) or ((ref.offset mod 4)<>0))) or
  1106. ((oppostfix=PF_H) and ((ref.offset<0) or (ref.offset>62) or ((ref.offset mod 2)<>0) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0)))) or
  1107. ((oppostfix=PF_B) and ((ref.offset<0) or (ref.offset>31) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0))))
  1108. )
  1109. ) then
  1110. begin
  1111. fixref(list,ref);
  1112. end;
  1113. if GenerateThumbCode then
  1114. begin
  1115. { certain thumb load require base and index }
  1116. if (oppostfix in [PF_SB,PF_SH]) and
  1117. (ref.base<>NR_NO) and (ref.index=NR_NO) then
  1118. begin
  1119. tmpreg1:=getintregister(list,OS_ADDR);
  1120. a_load_const_reg(list,OS_ADDR,0,tmpreg1);
  1121. ref.index:=tmpreg1;
  1122. end;
  1123. { "hi" registers cannot be used as base or index }
  1124. if (getsupreg(ref.base) in [RS_R8..RS_R12,RS_R14]) or
  1125. ((ref.base=NR_R13) and (ref.index<>NR_NO)) then
  1126. begin
  1127. tmpreg1:=getintregister(list,OS_ADDR);
  1128. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.base,tmpreg1);
  1129. ref.base:=tmpreg1;
  1130. end;
  1131. if getsupreg(ref.index) in [RS_R8..RS_R14] then
  1132. begin
  1133. tmpreg1:=getintregister(list,OS_ADDR);
  1134. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.index,tmpreg1);
  1135. ref.index:=tmpreg1;
  1136. end;
  1137. end;
  1138. { fold if there is base, index and offset, however, don't fold
  1139. for vfp memory instructions because we later fold the index }
  1140. if not((op in [A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1141. (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  1142. begin
  1143. if tmpreg1<>NR_NO then
  1144. begin
  1145. tmpreg2:=getintregister(list,OS_ADDR);
  1146. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg1,tmpreg2);
  1147. tmpreg1:=tmpreg2;
  1148. end
  1149. else
  1150. begin
  1151. tmpreg1:=getintregister(list,OS_ADDR);
  1152. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg1);
  1153. ref.base:=tmpreg1;
  1154. end;
  1155. ref.offset:=0;
  1156. end;
  1157. { floating point operations have only limited references
  1158. we expect here, that a base is already set }
  1159. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  1160. begin
  1161. if ref.shiftmode<>SM_none then
  1162. internalerror(200309121);
  1163. if tmpreg1<>NR_NO then
  1164. begin
  1165. if ref.base=tmpreg1 then
  1166. begin
  1167. if ref.signindex<0 then
  1168. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,tmpreg1,ref.index))
  1169. else
  1170. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,tmpreg1,ref.index));
  1171. ref.index:=NR_NO;
  1172. end
  1173. else
  1174. begin
  1175. if ref.index<>tmpreg1 then
  1176. internalerror(200403161);
  1177. if ref.signindex<0 then
  1178. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,ref.base,tmpreg1))
  1179. else
  1180. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,tmpreg1));
  1181. ref.base:=tmpreg1;
  1182. ref.index:=NR_NO;
  1183. end;
  1184. end
  1185. else
  1186. begin
  1187. tmpreg1:=getintregister(list,OS_ADDR);
  1188. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,ref.index));
  1189. ref.base:=tmpreg1;
  1190. ref.index:=NR_NO;
  1191. end;
  1192. end;
  1193. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  1194. Result := ref;
  1195. end;
  1196. procedure tbasecgarm.a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);
  1197. var
  1198. oppostfix:toppostfix;
  1199. usedtmpref: treference;
  1200. tmpreg : tregister;
  1201. dir : integer;
  1202. begin
  1203. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  1204. FromSize := ToSize;
  1205. case ToSize of
  1206. { signed integer registers }
  1207. OS_8,
  1208. OS_S8:
  1209. oppostfix:=PF_B;
  1210. OS_16,
  1211. OS_S16:
  1212. oppostfix:=PF_H;
  1213. OS_32,
  1214. OS_S32,
  1215. { for vfp value stored in integer register }
  1216. OS_F32:
  1217. oppostfix:=PF_None;
  1218. else
  1219. InternalError(200308299);
  1220. end;
  1221. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[tosize])) or
  1222. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  1223. (oppostfix =PF_H)) then
  1224. begin
  1225. if target_info.endian=endian_big then
  1226. dir:=-1
  1227. else
  1228. dir:=1;
  1229. case FromSize of
  1230. OS_16,OS_S16:
  1231. begin
  1232. tmpreg:=getintregister(list,OS_INT);
  1233. usedtmpref:=ref;
  1234. if target_info.endian=endian_big then
  1235. inc(usedtmpref.offset,1);
  1236. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1237. inc(usedtmpref.offset,dir);
  1238. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1239. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1240. end;
  1241. OS_32,OS_S32:
  1242. begin
  1243. tmpreg:=getintregister(list,OS_INT);
  1244. usedtmpref:=ref;
  1245. if ref.alignment=2 then
  1246. begin
  1247. if target_info.endian=endian_big then
  1248. inc(usedtmpref.offset,2);
  1249. usedtmpref:=a_internal_load_reg_ref(list,OS_16,OS_16,reg,usedtmpref);
  1250. a_op_const_reg_reg(list,OP_SHR,OS_INT,16,reg,tmpreg);
  1251. inc(usedtmpref.offset,dir*2);
  1252. a_internal_load_reg_ref(list,OS_16,OS_16,tmpreg,usedtmpref);
  1253. end
  1254. else
  1255. begin
  1256. if target_info.endian=endian_big then
  1257. inc(usedtmpref.offset,3);
  1258. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1259. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1260. inc(usedtmpref.offset,dir);
  1261. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1262. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1263. inc(usedtmpref.offset,dir);
  1264. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1265. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1266. inc(usedtmpref.offset,dir);
  1267. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1268. end;
  1269. end
  1270. else
  1271. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1272. end;
  1273. end
  1274. else
  1275. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1276. end;
  1277. function tbasecgarm.a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  1278. var
  1279. oppostfix:toppostfix;
  1280. href: treference;
  1281. tmpreg: TRegister;
  1282. begin
  1283. case ToSize of
  1284. { signed integer registers }
  1285. OS_8,
  1286. OS_S8:
  1287. oppostfix:=PF_B;
  1288. OS_16,
  1289. OS_S16:
  1290. oppostfix:=PF_H;
  1291. OS_32,
  1292. OS_S32:
  1293. oppostfix:=PF_None;
  1294. else
  1295. InternalError(2003082910);
  1296. end;
  1297. if (tosize in [OS_S16,OS_16]) and
  1298. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1299. begin
  1300. result:=handle_load_store(list,A_STR,PF_B,reg,ref);
  1301. tmpreg:=getintregister(list,OS_INT);
  1302. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1303. href:=result;
  1304. inc(href.offset);
  1305. handle_load_store(list,A_STR,PF_B,tmpreg,href);
  1306. end
  1307. else
  1308. result:=handle_load_store(list,A_STR,oppostfix,reg,ref);
  1309. end;
  1310. function tbasecgarm.a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  1311. var
  1312. oppostfix:toppostfix;
  1313. so: tshifterop;
  1314. tmpreg: TRegister;
  1315. href: treference;
  1316. begin
  1317. case FromSize of
  1318. { signed integer registers }
  1319. OS_8:
  1320. oppostfix:=PF_B;
  1321. OS_S8:
  1322. oppostfix:=PF_SB;
  1323. OS_16:
  1324. oppostfix:=PF_H;
  1325. OS_S16:
  1326. oppostfix:=PF_SH;
  1327. OS_32,
  1328. OS_S32:
  1329. oppostfix:=PF_None;
  1330. else
  1331. InternalError(200308291);
  1332. end;
  1333. if (tosize=OS_S8) and
  1334. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1335. begin
  1336. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1337. a_load_reg_reg(list,OS_S8,OS_32,reg,reg);
  1338. end
  1339. else if (tosize in [OS_S16,OS_16]) and
  1340. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1341. begin
  1342. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1343. tmpreg:=getintregister(list,OS_INT);
  1344. href:=result;
  1345. inc(href.offset);
  1346. handle_load_store(list,A_LDR,PF_B,tmpreg,href);
  1347. shifterop_reset(so);
  1348. so.shiftmode:=SM_LSL;
  1349. so.shiftimm:=8;
  1350. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  1351. end
  1352. else
  1353. result:=handle_load_store(list,A_LDR,oppostfix,reg,ref);
  1354. end;
  1355. procedure tbasecgarm.a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);
  1356. var
  1357. so : tshifterop;
  1358. procedure do_shift(shiftmode : tshiftmode; shiftimm : byte; reg : tregister);
  1359. begin
  1360. if GenerateThumbCode then
  1361. begin
  1362. case shiftmode of
  1363. SM_ASR:
  1364. a_op_const_reg_reg(list,OP_SAR,OS_32,shiftimm,reg,reg2);
  1365. SM_LSR:
  1366. a_op_const_reg_reg(list,OP_SHR,OS_32,shiftimm,reg,reg2);
  1367. SM_LSL:
  1368. a_op_const_reg_reg(list,OP_SHL,OS_32,shiftimm,reg,reg2);
  1369. else
  1370. internalerror(2013090301);
  1371. end;
  1372. end
  1373. else
  1374. begin
  1375. so.shiftmode:=shiftmode;
  1376. so.shiftimm:=shiftimm;
  1377. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,reg2,reg,so));
  1378. end;
  1379. end;
  1380. var
  1381. instr: taicpu;
  1382. conv_done: boolean;
  1383. begin
  1384. if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then
  1385. internalerror(2002090901);
  1386. conv_done:=false;
  1387. if tosize<>fromsize then
  1388. begin
  1389. shifterop_reset(so);
  1390. conv_done:=true;
  1391. if tcgsize2size[tosize]<=tcgsize2size[fromsize] then
  1392. fromsize:=tosize;
  1393. if current_settings.cputype<cpu_armv6 then
  1394. case fromsize of
  1395. OS_8:
  1396. if GenerateThumbCode then
  1397. a_op_const_reg_reg(list,OP_AND,OS_32,$ff,reg1,reg2)
  1398. else
  1399. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1400. OS_S8:
  1401. begin
  1402. do_shift(SM_LSL,24,reg1);
  1403. if tosize=OS_16 then
  1404. begin
  1405. do_shift(SM_ASR,8,reg2);
  1406. do_shift(SM_LSR,16,reg2);
  1407. end
  1408. else
  1409. do_shift(SM_ASR,24,reg2);
  1410. end;
  1411. OS_16:
  1412. begin
  1413. do_shift(SM_LSL,16,reg1);
  1414. do_shift(SM_LSR,16,reg2);
  1415. end;
  1416. OS_S16:
  1417. begin
  1418. do_shift(SM_LSL,16,reg1);
  1419. do_shift(SM_ASR,16,reg2)
  1420. end;
  1421. else
  1422. conv_done:=false;
  1423. end
  1424. else
  1425. case fromsize of
  1426. OS_8:
  1427. if GenerateThumbCode then
  1428. list.concat(taicpu.op_reg_reg(A_UXTB,reg2,reg1))
  1429. else
  1430. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1431. OS_S8:
  1432. begin
  1433. if tosize=OS_16 then
  1434. begin
  1435. so.shiftmode:=SM_ROR;
  1436. so.shiftimm:=16;
  1437. list.concat(taicpu.op_reg_reg_shifterop(A_SXTB16,reg2,reg1,so));
  1438. do_shift(SM_LSR,16,reg2);
  1439. end
  1440. else
  1441. list.concat(taicpu.op_reg_reg(A_SXTB,reg2,reg1));
  1442. end;
  1443. OS_16:
  1444. list.concat(taicpu.op_reg_reg(A_UXTH,reg2,reg1));
  1445. OS_S16:
  1446. list.concat(taicpu.op_reg_reg(A_SXTH,reg2,reg1));
  1447. else
  1448. conv_done:=false;
  1449. end
  1450. end;
  1451. if not conv_done and (reg1<>reg2) then
  1452. begin
  1453. { same size, only a register mov required }
  1454. instr:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
  1455. list.Concat(instr);
  1456. { Notify the register allocator that we have written a move instruction so
  1457. it can try to eliminate it. }
  1458. add_move_instruction(instr);
  1459. end;
  1460. end;
  1461. procedure tbasecgarm.a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);
  1462. var
  1463. href,href2 : treference;
  1464. hloc : pcgparalocation;
  1465. begin
  1466. href:=ref;
  1467. hloc:=paraloc.location;
  1468. while assigned(hloc) do
  1469. begin
  1470. case hloc^.loc of
  1471. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  1472. begin
  1473. paramanager.allocparaloc(list,paraloc.location);
  1474. a_loadfpu_ref_reg(list,size,size,ref,hloc^.register);
  1475. end;
  1476. LOC_REGISTER :
  1477. case hloc^.size of
  1478. OS_32,
  1479. OS_F32:
  1480. begin
  1481. paramanager.allocparaloc(list,paraloc.location);
  1482. a_load_ref_reg(list,OS_32,OS_32,href,hloc^.register);
  1483. end;
  1484. OS_64,
  1485. OS_F64:
  1486. cg64.a_load64_ref_cgpara(list,href,paraloc);
  1487. else
  1488. a_load_ref_reg(list,hloc^.size,hloc^.size,href,hloc^.register);
  1489. end;
  1490. LOC_REFERENCE :
  1491. begin
  1492. reference_reset_base(href2,hloc^.reference.index,hloc^.reference.offset,ctempposinvalid,paraloc.alignment,[]);
  1493. { concatcopy should choose the best way to copy the data }
  1494. g_concatcopy(list,href,href2,tcgsize2size[hloc^.size]);
  1495. end;
  1496. else
  1497. internalerror(200408241);
  1498. end;
  1499. inc(href.offset,tcgsize2size[hloc^.size]);
  1500. hloc:=hloc^.next;
  1501. end;
  1502. end;
  1503. procedure tbasecgarm.a_loadfpu_reg_reg(list: TAsmList; fromsize,tosize: tcgsize; reg1, reg2: tregister);
  1504. begin
  1505. list.concat(setoppostfix(taicpu.op_reg_reg(A_MVF,reg2,reg1),cgsize2fpuoppostfix[tosize]));
  1506. end;
  1507. procedure tbasecgarm.a_loadfpu_ref_reg(list: TAsmList; fromsize,tosize: tcgsize; const ref: treference; reg: tregister);
  1508. var
  1509. oppostfix:toppostfix;
  1510. begin
  1511. case fromsize of
  1512. OS_32,
  1513. OS_F32:
  1514. oppostfix:=PF_S;
  1515. OS_64,
  1516. OS_F64:
  1517. oppostfix:=PF_D;
  1518. OS_F80:
  1519. oppostfix:=PF_E;
  1520. else
  1521. InternalError(200309021);
  1522. end;
  1523. handle_load_store(list,A_LDF,oppostfix,reg,ref);
  1524. if fromsize<>tosize then
  1525. a_loadfpu_reg_reg(list,fromsize,tosize,reg,reg);
  1526. end;
  1527. procedure tbasecgarm.a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);
  1528. var
  1529. oppostfix:toppostfix;
  1530. begin
  1531. case tosize of
  1532. OS_F32:
  1533. oppostfix:=PF_S;
  1534. OS_F64:
  1535. oppostfix:=PF_D;
  1536. OS_F80:
  1537. oppostfix:=PF_E;
  1538. else
  1539. InternalError(200309022);
  1540. end;
  1541. handle_load_store(list,A_STF,oppostfix,reg,ref);
  1542. end;
  1543. { comparison operations }
  1544. procedure tbasecgarm.a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  1545. l : tasmlabel);
  1546. var
  1547. tmpreg : tregister;
  1548. b : byte;
  1549. begin
  1550. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1551. if (not(GenerateThumbCode) and is_shifter_const(a,b)) or
  1552. ((GenerateThumbCode) and is_thumb_imm(a)) then
  1553. list.concat(taicpu.op_reg_const(A_CMP,reg,a))
  1554. { CMN reg,0 and CMN reg,$80000000 are different from CMP reg,$ffffffff
  1555. and CMP reg,$7fffffff regarding the flags according to the ARM manual }
  1556. else if (a<>$7fffffff) and (a<>-1) and not(GenerateThumbCode) and is_shifter_const(-a,b) then
  1557. list.concat(taicpu.op_reg_const(A_CMN,reg,-a))
  1558. else
  1559. begin
  1560. tmpreg:=getintregister(list,size);
  1561. a_load_const_reg(list,size,a,tmpreg);
  1562. list.concat(taicpu.op_reg_reg(A_CMP,reg,tmpreg));
  1563. end;
  1564. a_jmp_cond(list,cmp_op,l);
  1565. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1566. end;
  1567. procedure tbasecgarm.a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister);
  1568. begin
  1569. if reverse then
  1570. begin
  1571. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,src));
  1572. list.Concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,31));
  1573. list.Concat(taicpu.op_reg_reg_const(A_AND,dst,dst,255));
  1574. end
  1575. { it is decided during the compilation of the system unit if this code is used or not
  1576. so no additional check for rbit is needed }
  1577. else
  1578. begin
  1579. list.Concat(taicpu.op_reg_reg(A_RBIT,dst,src));
  1580. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,dst));
  1581. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1582. list.Concat(taicpu.op_reg_const(A_CMP,dst,32));
  1583. if GenerateThumb2Code then
  1584. list.Concat(taicpu.op_cond(A_IT, C_EQ));
  1585. list.Concat(setcondition(taicpu.op_reg_const(A_MOV,dst,$ff),C_EQ));
  1586. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1587. end;
  1588. end;
  1589. procedure tbasecgarm.a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel);
  1590. begin
  1591. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1592. list.concat(taicpu.op_reg_reg(A_CMP,reg2,reg1));
  1593. a_jmp_cond(list,cmp_op,l);
  1594. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1595. end;
  1596. procedure tbasecgarm.a_jmp_name(list : TAsmList;const s : string);
  1597. var
  1598. ai : taicpu;
  1599. begin
  1600. { generate far jump, leave it to the optimizer to get rid of it }
  1601. if GenerateThumbCode then
  1602. ai:=taicpu.op_sym(A_BL,current_asmdata.RefAsmSymbol(s,AT_FUNCTION))
  1603. else
  1604. ai:=taicpu.op_sym(A_B,current_asmdata.RefAsmSymbol(s,AT_FUNCTION));
  1605. ai.is_jmp:=true;
  1606. list.concat(ai);
  1607. end;
  1608. procedure tbasecgarm.a_jmp_always(list : TAsmList;l: tasmlabel);
  1609. var
  1610. ai : taicpu;
  1611. begin
  1612. { generate far jump, leave it to the optimizer to get rid of it }
  1613. if GenerateThumbCode then
  1614. ai:=taicpu.op_sym(A_BL,l)
  1615. else
  1616. ai:=taicpu.op_sym(A_B,l);
  1617. ai.is_jmp:=true;
  1618. list.concat(ai);
  1619. end;
  1620. procedure tbasecgarm.a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel);
  1621. var
  1622. ai : taicpu;
  1623. inv_flags : TResFlags;
  1624. hlabel : TAsmLabel;
  1625. begin
  1626. if GenerateThumbCode then
  1627. begin
  1628. inv_flags:=f;
  1629. inverse_flags(inv_flags);
  1630. { the optimizer has to fix this if jump range is sufficient short }
  1631. current_asmdata.getjumplabel(hlabel);
  1632. ai:=setcondition(taicpu.op_sym(A_B,hlabel),flags_to_cond(inv_flags));
  1633. ai.is_jmp:=true;
  1634. list.concat(ai);
  1635. a_jmp_always(list,l);
  1636. a_label(list,hlabel);
  1637. end
  1638. else
  1639. begin
  1640. ai:=setcondition(taicpu.op_sym(A_B,l),flags_to_cond(f));
  1641. ai.is_jmp:=true;
  1642. list.concat(ai);
  1643. end;
  1644. end;
  1645. procedure tbasecgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  1646. begin
  1647. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  1648. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  1649. end;
  1650. procedure tbasecgarm.g_profilecode(list : TAsmList);
  1651. begin
  1652. if target_info.system = system_arm_linux then
  1653. begin
  1654. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R14]));
  1655. a_call_name(list,'__gnu_mcount_nc',false);
  1656. end
  1657. else
  1658. internalerror(2014091201);
  1659. end;
  1660. procedure tbasecgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  1661. var
  1662. ref : treference;
  1663. shift : byte;
  1664. firstfloatreg,lastfloatreg,
  1665. r : byte;
  1666. mmregs,
  1667. regs, saveregs : tcpuregisterset;
  1668. registerarea,
  1669. r7offset,
  1670. stackmisalignment : pint;
  1671. imm1, imm2: DWord;
  1672. stack_parameters : Boolean;
  1673. begin
  1674. LocalSize:=align(LocalSize,4);
  1675. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  1676. { call instruction does not put anything on the stack }
  1677. registerarea:=0;
  1678. tcpuprocinfo(current_procinfo).stackpaddingreg:=High(TSuperRegister);
  1679. lastfloatreg:=RS_NO;
  1680. if not(nostackframe) then
  1681. begin
  1682. firstfloatreg:=RS_NO;
  1683. mmregs:=[];
  1684. case current_settings.fputype of
  1685. fpu_fpa,
  1686. fpu_fpa10,
  1687. fpu_fpa11:
  1688. begin
  1689. { save floating point registers? }
  1690. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1691. for r:=RS_F0 to RS_F7 do
  1692. if r in regs then
  1693. begin
  1694. if firstfloatreg=RS_NO then
  1695. firstfloatreg:=r;
  1696. lastfloatreg:=r;
  1697. inc(registerarea,12);
  1698. end;
  1699. end;
  1700. fpu_vfpv2,
  1701. fpu_vfpv3,
  1702. fpu_vfpv4,
  1703. fpu_vfpv3_d16:
  1704. begin;
  1705. { the *[0..31] is a hack to prevent that the compiler tries to save odd single-type registers,
  1706. they have numbers>$1f which is not really correct as they should simply have the same numbers
  1707. as the even ones by with a different subtype as it is done on x86 with al/ah }
  1708. mmregs:=(rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall))*[0..31];
  1709. end;
  1710. end;
  1711. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1712. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1713. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  1714. { save int registers }
  1715. reference_reset(ref,4,[]);
  1716. ref.index:=NR_STACK_POINTER_REG;
  1717. ref.addressmode:=AM_PREINDEXED;
  1718. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  1719. if not(target_info.system in systems_darwin) then
  1720. begin
  1721. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1722. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1723. begin
  1724. a_reg_alloc(list,NR_R12);
  1725. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  1726. end;
  1727. { the (old) ARM APCS requires saving both the stack pointer (to
  1728. crawl the stack) and the PC (to identify the function this
  1729. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  1730. and R15 -- still needs updating for EABI and Darwin, they don't
  1731. need that }
  1732. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1733. regs:=regs+[RS_FRAME_POINTER_REG,RS_R12,RS_R14,RS_R15]
  1734. else
  1735. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1736. include(regs,RS_R14);
  1737. if regs<>[] then
  1738. begin
  1739. for r:=RS_R0 to RS_R15 do
  1740. if r in regs then
  1741. inc(registerarea,4);
  1742. { if the stack is not 8 byte aligned, try to add an extra register,
  1743. so we can avoid the extra sub/add ...,#4 later (KB) }
  1744. if ((registerarea mod current_settings.alignment.localalignmax) <> 0) then
  1745. for r:=RS_R3 downto RS_R0 do
  1746. if not(r in regs) then
  1747. begin
  1748. regs:=regs+[r];
  1749. inc(registerarea,4);
  1750. tcpuprocinfo(current_procinfo).stackpaddingreg:=r;
  1751. break;
  1752. end;
  1753. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  1754. end;
  1755. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1756. begin
  1757. { the framepointer now points to the saved R15, so the saved
  1758. framepointer is at R11-12 (for get_caller_frame) }
  1759. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  1760. a_reg_dealloc(list,NR_R12);
  1761. end;
  1762. end
  1763. else
  1764. begin
  1765. { always save r14 if we use r7 as the framepointer, because
  1766. the parameter offsets are hardcoded in advance and always
  1767. assume that r14 sits on the stack right behind the saved r7
  1768. }
  1769. if current_procinfo.framepointer=NR_FRAME_POINTER_REG then
  1770. include(regs,RS_FRAME_POINTER_REG);
  1771. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1772. include(regs,RS_R14);
  1773. if regs<>[] then
  1774. begin
  1775. { on Darwin, you first have to save [r4-r7,lr], and then
  1776. [r8,r10,r11] and make r7 point to the previously saved
  1777. r7 so that you can perform a stack crawl based on it
  1778. ([r7] is previous stack frame, [r7+4] is return address
  1779. }
  1780. include(regs,RS_FRAME_POINTER_REG);
  1781. saveregs:=regs-[RS_R8,RS_R10,RS_R11];
  1782. r7offset:=0;
  1783. for r:=RS_R0 to RS_R15 do
  1784. if r in saveregs then
  1785. begin
  1786. inc(registerarea,4);
  1787. if r<RS_FRAME_POINTER_REG then
  1788. inc(r7offset,4);
  1789. end;
  1790. { save the registers }
  1791. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1792. { make r7 point to the saved r7 (regardless of whether this
  1793. frame uses the framepointer, for backtrace purposes) }
  1794. if r7offset<>0 then
  1795. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_FRAME_POINTER_REG,NR_R13,r7offset))
  1796. else
  1797. list.concat(taicpu.op_reg_reg(A_MOV,NR_R7,NR_R13));
  1798. { now save the rest (if any) }
  1799. saveregs:=regs-saveregs;
  1800. if saveregs<>[] then
  1801. begin
  1802. for r:=RS_R8 to RS_R11 do
  1803. if r in saveregs then
  1804. inc(registerarea,4);
  1805. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1806. end;
  1807. end;
  1808. end;
  1809. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  1810. if (LocalSize<>0) or
  1811. ((stackmisalignment<>0) and
  1812. ((pi_do_call in current_procinfo.flags) or
  1813. (po_assembler in current_procinfo.procdef.procoptions))) then
  1814. begin
  1815. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  1816. if stack_parameters and (pi_estimatestacksize in current_procinfo.flags) then
  1817. begin
  1818. if localsize>tcpuprocinfo(current_procinfo).stackframesize then
  1819. internalerror(2014030901)
  1820. else
  1821. localsize:=tcpuprocinfo(current_procinfo).stackframesize-registerarea;
  1822. end;
  1823. if is_shifter_const(localsize,shift) then
  1824. begin
  1825. a_reg_dealloc(list,NR_R12);
  1826. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  1827. end
  1828. else if split_into_shifter_const(localsize, imm1, imm2) then
  1829. begin
  1830. a_reg_dealloc(list,NR_R12);
  1831. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  1832. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  1833. end
  1834. else
  1835. begin
  1836. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  1837. a_reg_alloc(list,NR_R12);
  1838. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  1839. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  1840. a_reg_dealloc(list,NR_R12);
  1841. end;
  1842. end;
  1843. if (mmregs<>[]) or
  1844. (firstfloatreg<>RS_NO) then
  1845. begin
  1846. reference_reset(ref,4,[]);
  1847. if (tg.direction*tcpuprocinfo(current_procinfo).floatregstart>=1023) or
  1848. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv4,fpu_vfpv3_d16]) then
  1849. begin
  1850. if not is_shifter_const(tcpuprocinfo(current_procinfo).floatregstart,shift) then
  1851. begin
  1852. a_reg_alloc(list,NR_R12);
  1853. a_load_const_reg(list,OS_ADDR,-tcpuprocinfo(current_procinfo).floatregstart,NR_R12);
  1854. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1855. a_reg_dealloc(list,NR_R12);
  1856. end
  1857. else
  1858. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tcpuprocinfo(current_procinfo).floatregstart));
  1859. ref.base:=NR_R12;
  1860. end
  1861. else
  1862. begin
  1863. ref.base:=current_procinfo.framepointer;
  1864. ref.offset:=tcpuprocinfo(current_procinfo).floatregstart;
  1865. end;
  1866. case current_settings.fputype of
  1867. fpu_fpa,
  1868. fpu_fpa10,
  1869. fpu_fpa11:
  1870. begin
  1871. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  1872. lastfloatreg-firstfloatreg+1,ref));
  1873. end;
  1874. fpu_vfpv2,
  1875. fpu_vfpv3,
  1876. fpu_vfpv4,
  1877. fpu_vfpv3_d16:
  1878. begin
  1879. ref.index:=ref.base;
  1880. ref.base:=NR_NO;
  1881. { FSTMX is deprecated on ARMv6 and later }
  1882. {if (current_settings.cputype<cpu_armv6) then
  1883. postfix:=PF_IAX
  1884. else
  1885. postfix:=PF_IAD;}
  1886. if mmregs<>[] then
  1887. list.concat(taicpu.op_ref_regset(A_VSTM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  1888. end;
  1889. end;
  1890. end;
  1891. end;
  1892. end;
  1893. procedure tbasecgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  1894. var
  1895. ref : treference;
  1896. LocalSize : longint;
  1897. firstfloatreg,lastfloatreg,
  1898. r,
  1899. shift : byte;
  1900. mmregs,
  1901. saveregs,
  1902. regs : tcpuregisterset;
  1903. registerarea,
  1904. stackmisalignment: pint;
  1905. paddingreg: TSuperRegister;
  1906. imm1, imm2: DWord;
  1907. begin
  1908. if not(nostackframe) then
  1909. begin
  1910. registerarea:=0;
  1911. firstfloatreg:=RS_NO;
  1912. lastfloatreg:=RS_NO;
  1913. mmregs:=[];
  1914. saveregs:=[];
  1915. case current_settings.fputype of
  1916. fpu_fpa,
  1917. fpu_fpa10,
  1918. fpu_fpa11:
  1919. begin
  1920. { restore floating point registers? }
  1921. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1922. for r:=RS_F0 to RS_F7 do
  1923. if r in regs then
  1924. begin
  1925. if firstfloatreg=RS_NO then
  1926. firstfloatreg:=r;
  1927. lastfloatreg:=r;
  1928. { floating point register space is already included in
  1929. localsize below by calc_stackframe_size
  1930. inc(registerarea,12);
  1931. }
  1932. end;
  1933. end;
  1934. fpu_vfpv2,
  1935. fpu_vfpv3,
  1936. fpu_vfpv4,
  1937. fpu_vfpv3_d16:
  1938. begin;
  1939. { restore vfp registers? }
  1940. { the *[0..31] is a hack to prevent that the compiler tries to save odd single-type registers,
  1941. they have numbers>$1f which is not really correct as they should simply have the same numbers
  1942. as the even ones by with a different subtype as it is done on x86 with al/ah }
  1943. mmregs:=(rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall))*[0..31];
  1944. end;
  1945. end;
  1946. if (firstfloatreg<>RS_NO) or
  1947. (mmregs<>[]) then
  1948. begin
  1949. reference_reset(ref,4,[]);
  1950. if (tg.direction*tcpuprocinfo(current_procinfo).floatregstart>=1023) or
  1951. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv4,fpu_vfpv3_d16]) then
  1952. begin
  1953. if not is_shifter_const(tcpuprocinfo(current_procinfo).floatregstart,shift) then
  1954. begin
  1955. a_reg_alloc(list,NR_R12);
  1956. a_load_const_reg(list,OS_ADDR,-tcpuprocinfo(current_procinfo).floatregstart,NR_R12);
  1957. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1958. a_reg_dealloc(list,NR_R12);
  1959. end
  1960. else
  1961. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tcpuprocinfo(current_procinfo).floatregstart));
  1962. ref.base:=NR_R12;
  1963. end
  1964. else
  1965. begin
  1966. ref.base:=current_procinfo.framepointer;
  1967. ref.offset:=tcpuprocinfo(current_procinfo).floatregstart;
  1968. end;
  1969. case current_settings.fputype of
  1970. fpu_fpa,
  1971. fpu_fpa10,
  1972. fpu_fpa11:
  1973. begin
  1974. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  1975. lastfloatreg-firstfloatreg+1,ref));
  1976. end;
  1977. fpu_vfpv2,
  1978. fpu_vfpv3,
  1979. fpu_vfpv4,
  1980. fpu_vfpv3_d16:
  1981. begin
  1982. ref.index:=ref.base;
  1983. ref.base:=NR_NO;
  1984. { FLDMX is deprecated on ARMv6 and later }
  1985. {if (current_settings.cputype<cpu_armv6) then
  1986. mmpostfix:=PF_IAX
  1987. else
  1988. mmpostfix:=PF_IAD;}
  1989. if mmregs<>[] then
  1990. list.concat(taicpu.op_ref_regset(A_VLDM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  1991. end;
  1992. end;
  1993. end;
  1994. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  1995. if (pi_do_call in current_procinfo.flags) or
  1996. (regs<>[]) or
  1997. ((target_info.system in systems_darwin) and
  1998. (current_procinfo.framepointer<>NR_STACK_POINTER_REG)) then
  1999. begin
  2000. exclude(regs,RS_R14);
  2001. include(regs,RS_R15);
  2002. if (target_info.system in systems_darwin) then
  2003. include(regs,RS_FRAME_POINTER_REG);
  2004. end;
  2005. if not(target_info.system in systems_darwin) then
  2006. begin
  2007. { restore saved stack pointer to SP (R13) and saved lr to PC (R15).
  2008. The saved PC came after that but is discarded, since we restore
  2009. the stack pointer }
  2010. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  2011. regs:=regs+[RS_FRAME_POINTER_REG,RS_R13,RS_R15];
  2012. end
  2013. else
  2014. begin
  2015. { restore R8-R11 already if necessary (they've been stored
  2016. before the others) }
  2017. saveregs:=regs*[RS_R8,RS_R10,RS_R11];
  2018. if saveregs<>[] then
  2019. begin
  2020. reference_reset(ref,4,[]);
  2021. ref.index:=NR_STACK_POINTER_REG;
  2022. ref.addressmode:=AM_PREINDEXED;
  2023. for r:=RS_R8 to RS_R11 do
  2024. if r in saveregs then
  2025. inc(registerarea,4);
  2026. regs:=regs-saveregs;
  2027. end;
  2028. end;
  2029. for r:=RS_R0 to RS_R15 do
  2030. if r in regs then
  2031. inc(registerarea,4);
  2032. { reapply the stack padding reg, in case there was one, see the complimentary
  2033. comment in g_proc_entry() (KB) }
  2034. paddingreg:=tcpuprocinfo(current_procinfo).stackpaddingreg;
  2035. if paddingreg < RS_R4 then
  2036. if paddingreg in regs then
  2037. internalerror(201306190)
  2038. else
  2039. begin
  2040. regs:=regs+[paddingreg];
  2041. inc(registerarea,4);
  2042. end;
  2043. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  2044. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  2045. (target_info.system in systems_darwin) then
  2046. begin
  2047. LocalSize:=current_procinfo.calc_stackframe_size;
  2048. if (LocalSize<>0) or
  2049. ((stackmisalignment<>0) and
  2050. ((pi_do_call in current_procinfo.flags) or
  2051. (po_assembler in current_procinfo.procdef.procoptions))) then
  2052. begin
  2053. if pi_estimatestacksize in current_procinfo.flags then
  2054. LocalSize:=tcpuprocinfo(current_procinfo).stackframesize-registerarea
  2055. else
  2056. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  2057. if is_shifter_const(LocalSize,shift) then
  2058. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  2059. else if split_into_shifter_const(localsize, imm1, imm2) then
  2060. begin
  2061. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  2062. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  2063. end
  2064. else
  2065. begin
  2066. a_reg_alloc(list,NR_R12);
  2067. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  2068. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  2069. a_reg_dealloc(list,NR_R12);
  2070. end;
  2071. end;
  2072. if (target_info.system in systems_darwin) and
  2073. (saveregs<>[]) then
  2074. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  2075. if regs=[] then
  2076. begin
  2077. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2078. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2079. else
  2080. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2081. end
  2082. else
  2083. begin
  2084. reference_reset(ref,4,[]);
  2085. ref.index:=NR_STACK_POINTER_REG;
  2086. ref.addressmode:=AM_PREINDEXED;
  2087. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  2088. end;
  2089. end
  2090. else
  2091. begin
  2092. { restore int registers and return }
  2093. reference_reset(ref,4,[]);
  2094. ref.index:=NR_FRAME_POINTER_REG;
  2095. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_EA));
  2096. end;
  2097. end
  2098. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2099. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2100. else
  2101. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2102. end;
  2103. procedure tbasecgarm.g_maybe_got_init(list : TAsmList);
  2104. var
  2105. ref : treference;
  2106. l : TAsmLabel;
  2107. regs : tcpuregisterset;
  2108. r: byte;
  2109. begin
  2110. if (cs_create_pic in current_settings.moduleswitches) and
  2111. (pi_needs_got in current_procinfo.flags) and
  2112. (tf_pic_uses_got in target_info.flags) then
  2113. begin
  2114. { Procedure parametrs are not initialized at this stage.
  2115. Before GOT initialization code, allocate registers used for procedure parameters
  2116. to prevent usage of these registers for temp operations in later stages of code
  2117. generation. }
  2118. regs:=rg[R_INTREGISTER].used_in_proc;
  2119. for r:=RS_R0 to RS_R3 do
  2120. if r in regs then
  2121. a_reg_alloc(list, newreg(R_INTREGISTER,r,R_SUBWHOLE));
  2122. { Allocate scratch register R12 and use it for GOT calculations directly.
  2123. Otherwise the init code can be distorted in later stages of code generation. }
  2124. a_reg_alloc(list,NR_R12);
  2125. reference_reset(ref,4,[]);
  2126. current_asmdata.getglobaldatalabel(l);
  2127. cg.a_label(current_procinfo.aktlocaldata,l);
  2128. ref.symbol:=l;
  2129. ref.base:=NR_PC;
  2130. ref.symboldata:=current_procinfo.aktlocaldata.last;
  2131. list.concat(Taicpu.op_reg_ref(A_LDR,NR_R12,ref));
  2132. current_asmdata.getaddrlabel(l);
  2133. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_32bit,l,current_asmdata.RefAsmSymbol('_GLOBAL_OFFSET_TABLE_',AT_DATA),-8));
  2134. cg.a_label(list,l);
  2135. list.concat(Taicpu.op_reg_reg_reg(A_ADD,NR_R12,NR_PC,NR_R12));
  2136. list.concat(Taicpu.op_reg_reg(A_MOV,current_procinfo.got,NR_R12));
  2137. { Deallocate registers }
  2138. a_reg_dealloc(list,NR_R12);
  2139. for r:=RS_R3 downto RS_R0 do
  2140. if r in regs then
  2141. a_reg_dealloc(list, newreg(R_INTREGISTER,r,R_SUBWHOLE));
  2142. end;
  2143. end;
  2144. procedure tbasecgarm.a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);
  2145. var
  2146. b : byte;
  2147. tmpref : treference;
  2148. instr : taicpu;
  2149. begin
  2150. if ref.addressmode<>AM_OFFSET then
  2151. internalerror(200309071);
  2152. tmpref:=ref;
  2153. { Be sure to have a base register }
  2154. if (tmpref.base=NR_NO) then
  2155. begin
  2156. if tmpref.shiftmode<>SM_None then
  2157. internalerror(2014020702);
  2158. if tmpref.signindex<0 then
  2159. internalerror(200312023);
  2160. tmpref.base:=tmpref.index;
  2161. tmpref.index:=NR_NO;
  2162. end;
  2163. if assigned(tmpref.symbol) or
  2164. not((is_shifter_const(tmpref.offset,b)) or
  2165. (is_shifter_const(-tmpref.offset,b))
  2166. ) then
  2167. fixref(list,tmpref);
  2168. { expect a base here if there is an index }
  2169. if (tmpref.base=NR_NO) and (tmpref.index<>NR_NO) then
  2170. internalerror(200312022);
  2171. if tmpref.index<>NR_NO then
  2172. begin
  2173. if tmpref.shiftmode<>SM_None then
  2174. internalerror(200312021);
  2175. if tmpref.signindex<0 then
  2176. a_op_reg_reg_reg(list,OP_SUB,OS_ADDR,tmpref.base,tmpref.index,r)
  2177. else
  2178. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpref.base,tmpref.index,r);
  2179. if tmpref.offset<>0 then
  2180. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,r,r);
  2181. end
  2182. else
  2183. begin
  2184. if tmpref.base=NR_NO then
  2185. a_load_const_reg(list,OS_ADDR,tmpref.offset,r)
  2186. else
  2187. if tmpref.offset<>0 then
  2188. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,tmpref.base,r)
  2189. else
  2190. begin
  2191. instr:=taicpu.op_reg_reg(A_MOV,r,tmpref.base);
  2192. list.concat(instr);
  2193. add_move_instruction(instr);
  2194. end;
  2195. end;
  2196. end;
  2197. procedure tbasecgarm.fixref(list : TAsmList;var ref : treference);
  2198. var
  2199. tmpreg, tmpreg2 : tregister;
  2200. tmpref : treference;
  2201. l, piclabel : tasmlabel;
  2202. indirection_done : boolean;
  2203. begin
  2204. { absolute symbols can't be handled directly, we've to store the symbol reference
  2205. in the text segment and access it pc relative
  2206. For now, we assume that references where base or index equals to PC are already
  2207. relative, all other references are assumed to be absolute and thus they need
  2208. to be handled extra.
  2209. A proper solution would be to change refoptions to a set and store the information
  2210. if the symbol is absolute or relative there.
  2211. }
  2212. { create consts entry }
  2213. reference_reset(tmpref,4,[]);
  2214. current_asmdata.getjumplabel(l);
  2215. cg.a_label(current_procinfo.aktlocaldata,l);
  2216. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  2217. piclabel:=nil;
  2218. tmpreg:=NR_NO;
  2219. indirection_done:=false;
  2220. if assigned(ref.symbol) then
  2221. begin
  2222. if (target_info.system=system_arm_darwin) and
  2223. (ref.symbol.bind in [AB_EXTERNAL,AB_WEAK_EXTERNAL,AB_PRIVATE_EXTERN,AB_COMMON]) then
  2224. begin
  2225. tmpreg:=g_indirect_sym_load(list,ref.symbol.name,asmsym2indsymflags(ref.symbol));
  2226. if ref.offset<>0 then
  2227. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2228. indirection_done:=true;
  2229. end
  2230. else if ref.refaddr=addr_gottpoff then
  2231. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_gottpoff,ref.symbol,ref.relsymbol,ref.offset))
  2232. else if (cs_create_pic in current_settings.moduleswitches) then
  2233. if (tf_pic_uses_got in target_info.flags) then
  2234. current_procinfo.aktlocaldata.concat(tai_const.Create_type_sym(aitconst_got,ref.symbol))
  2235. else
  2236. begin
  2237. { ideally, we would want to generate
  2238. ldr r1, LPICConstPool
  2239. LPICLocal:
  2240. ldr/str r2,[pc,r1]
  2241. ...
  2242. LPICConstPool:
  2243. .long _globsym-(LPICLocal+8)
  2244. However, we cannot be sure that the ldr/str will follow
  2245. right after the call to fixref, so we have to load the
  2246. complete address already in a register.
  2247. }
  2248. current_asmdata.getaddrlabel(piclabel);
  2249. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_ptr,piclabel,ref.symbol,ref.offset-8));
  2250. end
  2251. else
  2252. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset))
  2253. end
  2254. else
  2255. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ref.offset));
  2256. { load consts entry }
  2257. if not indirection_done then
  2258. begin
  2259. tmpreg:=getintregister(list,OS_INT);
  2260. tmpref.symbol:=l;
  2261. tmpref.base:=NR_PC;
  2262. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2263. if (cs_create_pic in current_settings.moduleswitches) and
  2264. (tf_pic_uses_got in target_info.flags) and
  2265. assigned(ref.symbol) then
  2266. begin
  2267. reference_reset(tmpref,4,[]);
  2268. tmpref.base:=current_procinfo.got;
  2269. tmpref.index:=tmpreg;
  2270. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2271. if ref.offset<>0 then
  2272. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2273. end;
  2274. end;
  2275. if assigned(piclabel) then
  2276. begin
  2277. cg.a_label(list,piclabel);
  2278. tmpreg2:=getaddressregister(list);
  2279. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpreg,NR_PC,tmpreg2);
  2280. tmpreg:=tmpreg2
  2281. end;
  2282. { This routine can be called with PC as base/index in case the offset
  2283. was too large to encode in a load/store. In that case, the entire
  2284. absolute expression has been re-encoded in a new constpool entry, and
  2285. we have to remove the use of PC from the original reference (the code
  2286. above made everything relative to the value loaded from the new
  2287. constpool entry) }
  2288. if is_pc(ref.base) then
  2289. ref.base:=NR_NO;
  2290. if is_pc(ref.index) then
  2291. ref.index:=NR_NO;
  2292. if (ref.base<>NR_NO) then
  2293. begin
  2294. if ref.index<>NR_NO then
  2295. begin
  2296. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  2297. ref.base:=tmpreg;
  2298. end
  2299. else
  2300. if ref.base<>NR_PC then
  2301. begin
  2302. ref.index:=tmpreg;
  2303. ref.shiftimm:=0;
  2304. ref.signindex:=1;
  2305. ref.shiftmode:=SM_None;
  2306. end
  2307. else
  2308. ref.base:=tmpreg;
  2309. end
  2310. else
  2311. ref.base:=tmpreg;
  2312. ref.offset:=0;
  2313. ref.symbol:=nil;
  2314. end;
  2315. procedure tbasecgarm.g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  2316. var
  2317. paraloc1,paraloc2,paraloc3 : TCGPara;
  2318. pd : tprocdef;
  2319. begin
  2320. pd:=search_system_proc('MOVE');
  2321. paraloc1.init;
  2322. paraloc2.init;
  2323. paraloc3.init;
  2324. paramanager.getintparaloc(list,pd,1,paraloc1);
  2325. paramanager.getintparaloc(list,pd,2,paraloc2);
  2326. paramanager.getintparaloc(list,pd,3,paraloc3);
  2327. a_load_const_cgpara(list,OS_SINT,len,paraloc3);
  2328. a_loadaddr_ref_cgpara(list,dest,paraloc2);
  2329. a_loadaddr_ref_cgpara(list,source,paraloc1);
  2330. paramanager.freecgpara(list,paraloc3);
  2331. paramanager.freecgpara(list,paraloc2);
  2332. paramanager.freecgpara(list,paraloc1);
  2333. alloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2334. alloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2335. a_call_name(list,'FPC_MOVE',false);
  2336. dealloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2337. dealloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2338. paraloc3.done;
  2339. paraloc2.done;
  2340. paraloc1.done;
  2341. end;
  2342. procedure tbasecgarm.g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  2343. const
  2344. maxtmpreg_arm = 10; {roozbeh: can be reduced to 8 or lower if might conflick with reserved ones,also +2 is used becouse of regs required for referencing}
  2345. maxtmpreg_thumb = 5;
  2346. var
  2347. srcref,dstref,usedtmpref,usedtmpref2:treference;
  2348. srcreg,destreg,countreg,r,tmpreg:tregister;
  2349. helpsize:aint;
  2350. copysize:byte;
  2351. cgsize:Tcgsize;
  2352. tmpregisters:array[1..maxtmpreg_arm] of tregister;
  2353. maxtmpreg,
  2354. tmpregi,tmpregi2:byte;
  2355. { will never be called with count<=4 }
  2356. procedure genloop(count : aword;size : byte);
  2357. const
  2358. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2359. var
  2360. l : tasmlabel;
  2361. begin
  2362. current_asmdata.getjumplabel(l);
  2363. if count<size then size:=1;
  2364. a_load_const_reg(list,OS_INT,count div size,countreg);
  2365. cg.a_label(list,l);
  2366. srcref.addressmode:=AM_POSTINDEXED;
  2367. dstref.addressmode:=AM_POSTINDEXED;
  2368. srcref.offset:=size;
  2369. dstref.offset:=size;
  2370. r:=getintregister(list,size2opsize[size]);
  2371. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2372. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2373. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1),PF_S));
  2374. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2375. a_jmp_flags(list,F_NE,l);
  2376. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2377. srcref.offset:=1;
  2378. dstref.offset:=1;
  2379. case count mod size of
  2380. 1:
  2381. begin
  2382. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2383. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2384. end;
  2385. 2:
  2386. if aligned then
  2387. begin
  2388. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2389. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2390. end
  2391. else
  2392. begin
  2393. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2394. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2395. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2396. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2397. end;
  2398. 3:
  2399. if aligned then
  2400. begin
  2401. srcref.offset:=2;
  2402. dstref.offset:=2;
  2403. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2404. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2405. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2406. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2407. end
  2408. else
  2409. begin
  2410. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2411. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2412. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2413. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2414. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2415. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2416. end;
  2417. end;
  2418. { keep the registers alive }
  2419. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2420. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2421. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2422. end;
  2423. { save estimation, if a creating a separate ref is needed or
  2424. if we can keep the original reference while copying }
  2425. function SimpleRef(const ref : treference) : boolean;
  2426. begin
  2427. result:=((ref.base=NR_PC) and (ref.addressmode=AM_OFFSET) and (ref.refaddr=addr_full)) or
  2428. ((ref.symbol=nil) and
  2429. (ref.addressmode=AM_OFFSET) and
  2430. (((ref.offset>=0) and (ref.offset+len<=31)) or
  2431. (not(GenerateThumbCode) and (ref.offset>=-255) and (ref.offset+len<=255)) or
  2432. { ldrh has a limited offset range }
  2433. (not(GenerateThumbCode) and ((len mod 4) in [0,1]) and (ref.offset>=-4095) and (ref.offset+len<=4095))
  2434. )
  2435. );
  2436. end;
  2437. { will never be called with count<=4 }
  2438. procedure genloop_thumb(count : aword;size : byte);
  2439. procedure refincofs(const ref : treference;const value : longint = 1);
  2440. begin
  2441. a_op_const_reg(list,OP_ADD,OS_ADDR,value,ref.base);
  2442. end;
  2443. const
  2444. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2445. var
  2446. l : tasmlabel;
  2447. begin
  2448. current_asmdata.getjumplabel(l);
  2449. if count<size then size:=1;
  2450. a_load_const_reg(list,OS_INT,count div size,countreg);
  2451. cg.a_label(list,l);
  2452. r:=getintregister(list,size2opsize[size]);
  2453. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2454. refincofs(srcref);
  2455. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2456. refincofs(dstref);
  2457. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2458. list.concat(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1));
  2459. a_jmp_flags(list,F_NE,l);
  2460. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2461. case count mod size of
  2462. 1:
  2463. begin
  2464. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2465. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2466. end;
  2467. 2:
  2468. if aligned then
  2469. begin
  2470. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2471. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2472. end
  2473. else
  2474. begin
  2475. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2476. refincofs(srcref);
  2477. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2478. refincofs(dstref);
  2479. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2480. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2481. end;
  2482. 3:
  2483. if aligned then
  2484. begin
  2485. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2486. refincofs(srcref,2);
  2487. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2488. refincofs(dstref,2);
  2489. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2490. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2491. end
  2492. else
  2493. begin
  2494. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2495. refincofs(srcref);
  2496. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2497. refincofs(dstref);
  2498. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2499. refincofs(srcref);
  2500. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2501. refincofs(dstref);
  2502. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2503. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2504. end;
  2505. end;
  2506. { keep the registers alive }
  2507. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2508. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2509. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2510. end;
  2511. begin
  2512. if len=0 then
  2513. exit;
  2514. if GenerateThumbCode then
  2515. maxtmpreg:=maxtmpreg_thumb
  2516. else
  2517. maxtmpreg:=maxtmpreg_arm;
  2518. helpsize:=12+maxtmpreg*4;//52 with maxtmpreg=10
  2519. dstref:=dest;
  2520. srcref:=source;
  2521. if cs_opt_size in current_settings.optimizerswitches then
  2522. helpsize:=8;
  2523. if aligned and (len=4) then
  2524. begin
  2525. tmpreg:=getintregister(list,OS_32);
  2526. a_load_ref_reg(list,OS_32,OS_32,source,tmpreg);
  2527. a_load_reg_ref(list,OS_32,OS_32,tmpreg,dest);
  2528. end
  2529. else if aligned and (len=2) then
  2530. begin
  2531. tmpreg:=getintregister(list,OS_16);
  2532. a_load_ref_reg(list,OS_16,OS_16,source,tmpreg);
  2533. a_load_reg_ref(list,OS_16,OS_16,tmpreg,dest);
  2534. end
  2535. else if (len<=helpsize) and aligned then
  2536. begin
  2537. tmpregi:=0;
  2538. { loading address in a separate register needed? }
  2539. if SimpleRef(source) then
  2540. begin
  2541. { ... then we don't need a loadaddr }
  2542. srcref:=source;
  2543. end
  2544. else
  2545. begin
  2546. srcreg:=getintregister(list,OS_ADDR);
  2547. a_loadaddr_ref_reg(list,source,srcreg);
  2548. reference_reset_base(srcref,srcreg,0,source.temppos,source.alignment,source.volatility);
  2549. end;
  2550. while (len div 4 <> 0) and (tmpregi<maxtmpreg) do
  2551. begin
  2552. inc(tmpregi);
  2553. tmpregisters[tmpregi]:=getintregister(list,OS_32);
  2554. a_load_ref_reg(list,OS_32,OS_32,srcref,tmpregisters[tmpregi]);
  2555. inc(srcref.offset,4);
  2556. dec(len,4);
  2557. end;
  2558. { loading address in a separate register needed? }
  2559. if SimpleRef(dest) then
  2560. dstref:=dest
  2561. else
  2562. begin
  2563. destreg:=getintregister(list,OS_ADDR);
  2564. a_loadaddr_ref_reg(list,dest,destreg);
  2565. reference_reset_base(dstref,destreg,0,dest.temppos,dest.alignment,dest.volatility);
  2566. end;
  2567. tmpregi2:=1;
  2568. while (tmpregi2<=tmpregi) do
  2569. begin
  2570. a_load_reg_ref(list,OS_32,OS_32,tmpregisters[tmpregi2],dstref);
  2571. inc(dstref.offset,4);
  2572. inc(tmpregi2);
  2573. end;
  2574. copysize:=4;
  2575. cgsize:=OS_32;
  2576. while len<>0 do
  2577. begin
  2578. if len<2 then
  2579. begin
  2580. copysize:=1;
  2581. cgsize:=OS_8;
  2582. end
  2583. else if len<4 then
  2584. begin
  2585. copysize:=2;
  2586. cgsize:=OS_16;
  2587. end;
  2588. dec(len,copysize);
  2589. r:=getintregister(list,cgsize);
  2590. a_load_ref_reg(list,cgsize,cgsize,srcref,r);
  2591. a_load_reg_ref(list,cgsize,cgsize,r,dstref);
  2592. inc(srcref.offset,copysize);
  2593. inc(dstref.offset,copysize);
  2594. end;{end of while}
  2595. end
  2596. else
  2597. begin
  2598. cgsize:=OS_32;
  2599. if (len<=4) then{len<=4 and not aligned}
  2600. begin
  2601. r:=getintregister(list,cgsize);
  2602. usedtmpref:=a_internal_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2603. if Len=1 then
  2604. a_load_reg_ref(list,OS_8,OS_8,r,dstref)
  2605. else
  2606. begin
  2607. tmpreg:=getintregister(list,cgsize);
  2608. usedtmpref2:=a_internal_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2609. inc(usedtmpref.offset,1);
  2610. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2611. inc(usedtmpref2.offset,1);
  2612. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2613. if len>2 then
  2614. begin
  2615. inc(usedtmpref.offset,1);
  2616. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2617. inc(usedtmpref2.offset,1);
  2618. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2619. if len>3 then
  2620. begin
  2621. inc(usedtmpref.offset,1);
  2622. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2623. inc(usedtmpref2.offset,1);
  2624. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2625. end;
  2626. end;
  2627. end;
  2628. end{end of if len<=4}
  2629. else
  2630. begin{unaligned & 4<len<helpsize **or** aligned/unaligned & len>helpsize}
  2631. destreg:=getintregister(list,OS_ADDR);
  2632. a_loadaddr_ref_reg(list,dest,destreg);
  2633. reference_reset_base(dstref,destreg,0,dest.temppos,dest.alignment,dest.volatility);
  2634. srcreg:=getintregister(list,OS_ADDR);
  2635. a_loadaddr_ref_reg(list,source,srcreg);
  2636. reference_reset_base(srcref,srcreg,0,dest.temppos,source.alignment,source.volatility);
  2637. countreg:=getintregister(list,OS_32);
  2638. // if cs_opt_size in current_settings.optimizerswitches then
  2639. { roozbeh : it seems loading 1 byte is faster becouse of caching/fetching(?) }
  2640. {if aligned then
  2641. genloop(len,4)
  2642. else}
  2643. if GenerateThumbCode then
  2644. genloop_thumb(len,1)
  2645. else
  2646. genloop(len,1);
  2647. end;
  2648. end;
  2649. end;
  2650. procedure tbasecgarm.g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);
  2651. begin
  2652. g_concatcopy_internal(list,source,dest,len,false);
  2653. end;
  2654. procedure tbasecgarm.g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);
  2655. begin
  2656. if (source.alignment in [1,3]) or
  2657. (dest.alignment in [1,3]) then
  2658. g_concatcopy_internal(list,source,dest,len,false)
  2659. else
  2660. g_concatcopy_internal(list,source,dest,len,true);
  2661. end;
  2662. procedure tbasecgarm.g_overflowCheck(list : TAsmList;const l : tlocation;def : tdef);
  2663. var
  2664. ovloc : tlocation;
  2665. begin
  2666. ovloc.loc:=LOC_VOID;
  2667. g_overflowCheck_loc(list,l,def,ovloc);
  2668. end;
  2669. procedure tbasecgarm.g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);
  2670. var
  2671. hl : tasmlabel;
  2672. ai:TAiCpu;
  2673. hflags : tresflags;
  2674. begin
  2675. if not(cs_check_overflow in current_settings.localswitches) then
  2676. exit;
  2677. current_asmdata.getjumplabel(hl);
  2678. case ovloc.loc of
  2679. LOC_VOID:
  2680. begin
  2681. ai:=taicpu.op_sym(A_B,hl);
  2682. ai.is_jmp:=true;
  2683. if not((def.typ=pointerdef) or
  2684. ((def.typ=orddef) and
  2685. (torddef(def).ordtype in [u64bit,u16bit,u32bit,u8bit,uchar,
  2686. pasbool1,pasbool8,pasbool16,pasbool32,pasbool64]))) then
  2687. ai.SetCondition(C_VC)
  2688. else
  2689. if TAiCpu(List.Last).opcode in [A_RSB,A_RSC,A_SBC,A_SUB] then
  2690. ai.SetCondition(C_CS)
  2691. else
  2692. ai.SetCondition(C_CC);
  2693. list.concat(ai);
  2694. end;
  2695. LOC_FLAGS:
  2696. begin
  2697. hflags:=ovloc.resflags;
  2698. inverse_flags(hflags);
  2699. cg.a_jmp_flags(list,hflags,hl);
  2700. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2701. end;
  2702. else
  2703. internalerror(200409281);
  2704. end;
  2705. a_call_name(list,'FPC_OVERFLOW',false);
  2706. a_label(list,hl);
  2707. end;
  2708. procedure tbasecgarm.g_save_registers(list : TAsmList);
  2709. begin
  2710. { this work is done in g_proc_entry }
  2711. end;
  2712. procedure tbasecgarm.g_restore_registers(list : TAsmList);
  2713. begin
  2714. { this work is done in g_proc_exit }
  2715. end;
  2716. procedure tbasecgarm.a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  2717. var
  2718. ai : taicpu;
  2719. hlabel : TAsmLabel;
  2720. begin
  2721. if GenerateThumbCode then
  2722. begin
  2723. { the optimizer has to fix this if jump range is sufficient short }
  2724. current_asmdata.getjumplabel(hlabel);
  2725. ai:=Taicpu.Op_sym(A_B,hlabel);
  2726. ai.SetCondition(inverse_cond(OpCmp2AsmCond[cond]));
  2727. ai.is_jmp:=true;
  2728. list.concat(ai);
  2729. a_jmp_always(list,l);
  2730. a_label(list,hlabel);
  2731. end
  2732. else
  2733. begin
  2734. ai:=Taicpu.Op_sym(A_B,l);
  2735. ai.SetCondition(OpCmp2AsmCond[cond]);
  2736. ai.is_jmp:=true;
  2737. list.concat(ai);
  2738. end;
  2739. end;
  2740. function get_scalar_mm_op(fromsize,tosize : tcgsize) : tasmop;
  2741. const
  2742. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of tasmop = (
  2743. (A_VMOV,A_VCVT,A_NONE,A_NONE,A_NONE),
  2744. (A_VCVT,A_VMOV,A_NONE,A_NONE,A_NONE),
  2745. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2746. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2747. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE));
  2748. begin
  2749. result:=convertop[fromsize,tosize];
  2750. if result=A_NONE then
  2751. internalerror(200312205);
  2752. end;
  2753. function get_scalar_mm_prefix(fromsize,tosize : tcgsize) : TOpPostfix;
  2754. const
  2755. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of TOpPostfix = (
  2756. (PF_F32, PF_F32F64,PF_None,PF_None,PF_None),
  2757. (PF_F64F32,PF_F64, PF_None,PF_None,PF_None),
  2758. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2759. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2760. (PF_None, PF_None, PF_None,PF_None,PF_None));
  2761. begin
  2762. result:=convertop[fromsize,tosize];
  2763. end;
  2764. procedure tbasecgarm.a_loadmm_reg_reg(list: tasmlist; fromsize,tosize: tcgsize; reg1,reg2: tregister; shuffle: pmmshuffle);
  2765. var
  2766. instr: taicpu;
  2767. begin
  2768. if (shuffle=nil) or shufflescalar(shuffle) then
  2769. instr:=setoppostfix(taicpu.op_reg_reg(get_scalar_mm_op(tosize,fromsize),reg2,reg1),get_scalar_mm_prefix(tosize,fromsize))
  2770. else
  2771. internalerror(2009112407);
  2772. list.concat(instr);
  2773. case instr.opcode of
  2774. A_VMOV:
  2775. add_move_instruction(instr);
  2776. end;
  2777. end;
  2778. procedure tbasecgarm.a_loadmm_ref_reg(list: tasmlist; fromsize,tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  2779. var
  2780. intreg,
  2781. tmpmmreg : tregister;
  2782. reg64 : tregister64;
  2783. begin
  2784. if assigned(shuffle) and
  2785. not(shufflescalar(shuffle)) then
  2786. internalerror(2009112413);
  2787. case fromsize of
  2788. OS_32,OS_S32:
  2789. begin
  2790. fromsize:=OS_F32;
  2791. { since we are loading an integer, no conversion may be required }
  2792. if (fromsize<>tosize) then
  2793. internalerror(2009112801);
  2794. end;
  2795. OS_64,OS_S64:
  2796. begin
  2797. fromsize:=OS_F64;
  2798. { since we are loading an integer, no conversion may be required }
  2799. if (fromsize<>tosize) then
  2800. internalerror(2009112901);
  2801. end;
  2802. end;
  2803. if (fromsize<>tosize) then
  2804. tmpmmreg:=getmmregister(list,fromsize)
  2805. else
  2806. tmpmmreg:=reg;
  2807. if (ref.alignment in [1,2]) then
  2808. begin
  2809. case fromsize of
  2810. OS_F32:
  2811. begin
  2812. intreg:=getintregister(list,OS_32);
  2813. a_load_ref_reg(list,OS_32,OS_32,ref,intreg);
  2814. a_loadmm_intreg_reg(list,OS_32,OS_F32,intreg,tmpmmreg,mms_movescalar);
  2815. end;
  2816. OS_F64:
  2817. begin
  2818. reg64.reglo:=getintregister(list,OS_32);
  2819. reg64.reghi:=getintregister(list,OS_32);
  2820. cg64.a_load64_ref_reg(list,ref,reg64);
  2821. cg64.a_loadmm_intreg64_reg(list,OS_F64,reg64,tmpmmreg);
  2822. end;
  2823. else
  2824. internalerror(2009112412);
  2825. end;
  2826. end
  2827. else
  2828. begin
  2829. handle_load_store(list,A_VLDR,PF_None,tmpmmreg,ref);
  2830. end;
  2831. if (tmpmmreg<>reg) then
  2832. a_loadmm_reg_reg(list,fromsize,tosize,tmpmmreg,reg,shuffle);
  2833. end;
  2834. procedure tbasecgarm.a_loadmm_reg_ref(list: tasmlist; fromsize,tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  2835. var
  2836. intreg,
  2837. tmpmmreg : tregister;
  2838. reg64 : tregister64;
  2839. begin
  2840. if assigned(shuffle) and
  2841. not(shufflescalar(shuffle)) then
  2842. internalerror(2009112416);
  2843. case tosize of
  2844. OS_32,OS_S32:
  2845. begin
  2846. tosize:=OS_F32;
  2847. { since we are loading an integer, no conversion may be required }
  2848. if (fromsize<>tosize) then
  2849. internalerror(2009112801);
  2850. end;
  2851. OS_64,OS_S64:
  2852. begin
  2853. tosize:=OS_F64;
  2854. { since we are loading an integer, no conversion may be required }
  2855. if (fromsize<>tosize) then
  2856. internalerror(2009112901);
  2857. end;
  2858. end;
  2859. if (fromsize<>tosize) then
  2860. begin
  2861. tmpmmreg:=getmmregister(list,tosize);
  2862. a_loadmm_reg_reg(list,fromsize,tosize,reg,tmpmmreg,shuffle);
  2863. end
  2864. else
  2865. tmpmmreg:=reg;
  2866. if (ref.alignment in [1,2]) then
  2867. begin
  2868. case tosize of
  2869. OS_F32:
  2870. begin
  2871. intreg:=getintregister(list,OS_32);
  2872. a_loadmm_reg_intreg(list,OS_F32,OS_32,tmpmmreg,intreg,shuffle);
  2873. a_load_reg_ref(list,OS_32,OS_32,intreg,ref);
  2874. end;
  2875. OS_F64:
  2876. begin
  2877. reg64.reglo:=getintregister(list,OS_32);
  2878. reg64.reghi:=getintregister(list,OS_32);
  2879. cg64.a_loadmm_reg_intreg64(list,OS_F64,tmpmmreg,reg64);
  2880. cg64.a_load64_reg_ref(list,reg64,ref);
  2881. end;
  2882. else
  2883. internalerror(2009112417);
  2884. end;
  2885. end
  2886. else
  2887. begin
  2888. handle_load_store(list,A_VSTR,PF_None,tmpmmreg,ref);
  2889. end;
  2890. end;
  2891. procedure tbasecgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  2892. begin
  2893. { this code can only be used to transfer raw data, not to perform
  2894. conversions }
  2895. if (tosize<>OS_F32) then
  2896. internalerror(2009112419);
  2897. if not(fromsize in [OS_32,OS_S32]) then
  2898. internalerror(2009112420);
  2899. if assigned(shuffle) and
  2900. not shufflescalar(shuffle) then
  2901. internalerror(2009112516);
  2902. list.concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg));
  2903. end;
  2904. procedure tbasecgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize; mmreg, intreg: tregister;shuffle : pmmshuffle);
  2905. begin
  2906. { this code can only be used to transfer raw data, not to perform
  2907. conversions }
  2908. if (fromsize<>OS_F32) then
  2909. internalerror(2009112430);
  2910. if not(tosize in [OS_32,OS_S32]) then
  2911. internalerror(2009112420);
  2912. if assigned(shuffle) and
  2913. not shufflescalar(shuffle) then
  2914. internalerror(2009112514);
  2915. list.concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg));
  2916. end;
  2917. procedure tbasecgarm.a_opmm_reg_reg(list: tasmlist; op: topcg; size: tcgsize; src, dst: tregister; shuffle: pmmshuffle);
  2918. var
  2919. tmpreg: tregister;
  2920. begin
  2921. { the vfp doesn't support xor nor any other logical operation, but
  2922. this routine is used to initialise global mm regvars. We can
  2923. easily initialise an mm reg with 0 though. }
  2924. case op of
  2925. OP_XOR:
  2926. begin
  2927. if (src<>dst) or
  2928. (reg_cgsize(src)<>size) or
  2929. assigned(shuffle) then
  2930. internalerror(2009112907);
  2931. tmpreg:=getintregister(list,OS_32);
  2932. a_load_const_reg(list,OS_32,0,tmpreg);
  2933. case size of
  2934. OS_F32:
  2935. list.concat(taicpu.op_reg_reg(A_VMOV,dst,tmpreg));
  2936. OS_F64:
  2937. list.concat(taicpu.op_reg_reg_reg(A_VMOV,dst,tmpreg,tmpreg));
  2938. else
  2939. internalerror(2009112908);
  2940. end;
  2941. end
  2942. else
  2943. internalerror(2009112906);
  2944. end;
  2945. end;
  2946. procedure tbasecgarm.maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  2947. const
  2948. overflowops = [OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NEG];
  2949. begin
  2950. if (op in overflowops) and
  2951. (size in [OS_8,OS_S8,OS_16,OS_S16]) then
  2952. a_load_reg_reg(list,OS_32,size,dst,dst);
  2953. end;
  2954. procedure tbasecgarm.safe_mla(list : TAsmList; op1,op2,op3,op4 : TRegister);
  2955. procedure checkreg(var reg : TRegister);
  2956. var
  2957. tmpreg : TRegister;
  2958. begin
  2959. if ((GenerateThumbCode or GenerateThumb2Code) and (getsupreg(reg)=RS_R13)) or
  2960. (getsupreg(reg)=RS_R15) then
  2961. begin
  2962. tmpreg:=getintregister(list,OS_INT);
  2963. a_load_reg_reg(list,OS_INT,OS_INT,reg,tmpreg);
  2964. reg:=tmpreg;
  2965. end;
  2966. end;
  2967. begin
  2968. checkreg(op1);
  2969. checkreg(op2);
  2970. checkreg(op3);
  2971. checkreg(op4);
  2972. list.concat(taicpu.op_reg_reg_reg_reg(A_MLA,op1,op2,op3,op4));
  2973. end;
  2974. procedure tbasecgarm.g_maybe_tls_init(list : TAsmList);
  2975. begin
  2976. list.concat(tai_regalloc.alloc(NR_R0,nil));
  2977. a_call_name(list,'fpc_read_tp',false);
  2978. a_load_reg_reg(list,OS_ADDR,OS_ADDR,NR_R0,current_procinfo.tlsoffset);
  2979. list.concat(tai_regalloc.dealloc(NR_R0,nil));
  2980. end;
  2981. procedure tcg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  2982. begin
  2983. case op of
  2984. OP_NEG:
  2985. begin
  2986. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2987. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  2988. list.concat(taicpu.op_reg_reg_const(A_RSC,regdst.reghi,regsrc.reghi,0));
  2989. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2990. end;
  2991. OP_NOT:
  2992. begin
  2993. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  2994. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  2995. end;
  2996. else
  2997. a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);
  2998. end;
  2999. end;
  3000. procedure tcg64farm.a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);
  3001. begin
  3002. a_op64_const_reg_reg(list,op,size,value,reg,reg);
  3003. end;
  3004. procedure tcg64farm.a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);
  3005. var
  3006. ovloc : tlocation;
  3007. begin
  3008. a_op64_const_reg_reg_checkoverflow(list,op,size,value,regsrc,regdst,false,ovloc);
  3009. end;
  3010. procedure tcg64farm.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);
  3011. var
  3012. ovloc : tlocation;
  3013. begin
  3014. a_op64_reg_reg_reg_checkoverflow(list,op,size,regsrc1,regsrc2,regdst,false,ovloc);
  3015. end;
  3016. procedure tcg64farm.a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);
  3017. begin
  3018. { this code can only be used to transfer raw data, not to perform
  3019. conversions }
  3020. if (mmsize<>OS_F64) then
  3021. internalerror(2009112405);
  3022. list.concat(taicpu.op_reg_reg_reg(A_VMOV,mmreg,intreg.reglo,intreg.reghi));
  3023. end;
  3024. procedure tcg64farm.a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);
  3025. begin
  3026. { this code can only be used to transfer raw data, not to perform
  3027. conversions }
  3028. if (mmsize<>OS_F64) then
  3029. internalerror(2009112406);
  3030. list.concat(taicpu.op_reg_reg_reg(A_VMOV,intreg.reglo,intreg.reghi,mmreg));
  3031. end;
  3032. procedure tcg64farm.a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3033. var
  3034. tmpreg : tregister;
  3035. b : byte;
  3036. begin
  3037. ovloc.loc:=LOC_VOID;
  3038. case op of
  3039. OP_NEG,
  3040. OP_NOT :
  3041. internalerror(2012022501);
  3042. end;
  3043. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3044. begin
  3045. case op of
  3046. OP_ADD:
  3047. begin
  3048. if is_shifter_const(lo(value),b) then
  3049. begin
  3050. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3051. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3052. end
  3053. else
  3054. begin
  3055. tmpreg:=cg.getintregister(list,OS_32);
  3056. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3057. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3058. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3059. end;
  3060. if is_shifter_const(hi(value),b) then
  3061. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,hi(value)),PF_S))
  3062. else
  3063. begin
  3064. tmpreg:=cg.getintregister(list,OS_32);
  3065. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3066. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3067. end;
  3068. end;
  3069. OP_SUB:
  3070. begin
  3071. if is_shifter_const(lo(value),b) then
  3072. begin
  3073. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3074. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3075. end
  3076. else
  3077. begin
  3078. tmpreg:=cg.getintregister(list,OS_32);
  3079. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3080. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3081. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3082. end;
  3083. if is_shifter_const(hi(value),b) then
  3084. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))),PF_S))
  3085. else
  3086. begin
  3087. tmpreg:=cg.getintregister(list,OS_32);
  3088. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3089. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3090. end;
  3091. end;
  3092. else
  3093. internalerror(200502131);
  3094. end;
  3095. if size=OS_64 then
  3096. begin
  3097. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3098. ovloc.loc:=LOC_FLAGS;
  3099. case op of
  3100. OP_ADD:
  3101. ovloc.resflags:=F_CS;
  3102. OP_SUB:
  3103. ovloc.resflags:=F_CC;
  3104. end;
  3105. end;
  3106. end
  3107. else
  3108. begin
  3109. case op of
  3110. OP_AND,OP_OR,OP_XOR:
  3111. begin
  3112. cg.a_op_const_reg_reg(list,op,OS_32,aint(lo(value)),regsrc.reglo,regdst.reglo);
  3113. cg.a_op_const_reg_reg(list,op,OS_32,aint(hi(value)),regsrc.reghi,regdst.reghi);
  3114. end;
  3115. OP_ADD:
  3116. begin
  3117. if is_shifter_const(aint(lo(value)),b) then
  3118. begin
  3119. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3120. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3121. end
  3122. else
  3123. begin
  3124. tmpreg:=cg.getintregister(list,OS_32);
  3125. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3126. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3127. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3128. end;
  3129. if is_shifter_const(aint(hi(value)),b) then
  3130. list.concat(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3131. else
  3132. begin
  3133. tmpreg:=cg.getintregister(list,OS_32);
  3134. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  3135. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg));
  3136. end;
  3137. end;
  3138. OP_SUB:
  3139. begin
  3140. if is_shifter_const(aint(lo(value)),b) then
  3141. begin
  3142. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3143. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3144. end
  3145. else
  3146. begin
  3147. tmpreg:=cg.getintregister(list,OS_32);
  3148. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3149. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3150. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3151. end;
  3152. if is_shifter_const(aint(hi(value)),b) then
  3153. list.concat(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3154. else
  3155. begin
  3156. tmpreg:=cg.getintregister(list,OS_32);
  3157. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3158. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg));
  3159. end;
  3160. end;
  3161. else
  3162. internalerror(2003083101);
  3163. end;
  3164. end;
  3165. end;
  3166. procedure tcg64farm.a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3167. begin
  3168. ovloc.loc:=LOC_VOID;
  3169. case op of
  3170. OP_NEG,
  3171. OP_NOT :
  3172. internalerror(2012022502);
  3173. end;
  3174. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3175. begin
  3176. case op of
  3177. OP_ADD:
  3178. begin
  3179. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3180. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3181. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi),PF_S));
  3182. end;
  3183. OP_SUB:
  3184. begin
  3185. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3186. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3187. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi),PF_S));
  3188. end;
  3189. else
  3190. internalerror(2003083101);
  3191. end;
  3192. if size=OS_64 then
  3193. begin
  3194. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3195. ovloc.loc:=LOC_FLAGS;
  3196. case op of
  3197. OP_ADD:
  3198. ovloc.resflags:=F_CS;
  3199. OP_SUB:
  3200. ovloc.resflags:=F_CC;
  3201. end;
  3202. end;
  3203. end
  3204. else
  3205. begin
  3206. case op of
  3207. OP_AND,OP_OR,OP_XOR:
  3208. begin
  3209. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);
  3210. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);
  3211. end;
  3212. OP_ADD:
  3213. begin
  3214. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3215. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3216. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi));
  3217. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3218. end;
  3219. OP_SUB:
  3220. begin
  3221. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3222. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3223. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi));
  3224. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3225. end;
  3226. else
  3227. internalerror(2003083101);
  3228. end;
  3229. end;
  3230. end;
  3231. procedure tthumbcgarm.init_register_allocators;
  3232. begin
  3233. inherited init_register_allocators;
  3234. if assigned(current_procinfo) and (current_procinfo.framepointer=NR_R7) then
  3235. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3236. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6],first_int_imreg,[])
  3237. else
  3238. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3239. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7],first_int_imreg,[]);
  3240. end;
  3241. procedure tthumbcgarm.done_register_allocators;
  3242. begin
  3243. rg[R_INTREGISTER].free;
  3244. rg[R_FPUREGISTER].free;
  3245. rg[R_MMREGISTER].free;
  3246. inherited done_register_allocators;
  3247. end;
  3248. procedure tthumbcgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  3249. var
  3250. ref : treference;
  3251. r : byte;
  3252. regs : tcpuregisterset;
  3253. stackmisalignment : pint;
  3254. registerarea: DWord;
  3255. stack_parameters: Boolean;
  3256. begin
  3257. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3258. LocalSize:=align(LocalSize,4);
  3259. { call instruction does not put anything on the stack }
  3260. stackmisalignment:=0;
  3261. if not(nostackframe) then
  3262. begin
  3263. a_reg_alloc(list,NR_STACK_POINTER_REG);
  3264. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3265. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  3266. { save int registers }
  3267. reference_reset(ref,4,[]);
  3268. ref.index:=NR_STACK_POINTER_REG;
  3269. ref.addressmode:=AM_PREINDEXED;
  3270. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3271. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3272. begin
  3273. //!!!! a_reg_alloc(list,NR_R12);
  3274. //!!!! list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  3275. end;
  3276. { the (old) ARM APCS requires saving both the stack pointer (to
  3277. crawl the stack) and the PC (to identify the function this
  3278. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  3279. and R15 -- still needs updating for EABI and Darwin, they don't
  3280. need that }
  3281. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3282. regs:=regs+[RS_R7,RS_R14]
  3283. else
  3284. // if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  3285. include(regs,RS_R14);
  3286. { safely estimate stack size }
  3287. if localsize+current_settings.alignment.localalignmax+4>508 then
  3288. begin
  3289. include(rg[R_INTREGISTER].used_in_proc,RS_R4);
  3290. include(regs,RS_R4);
  3291. end;
  3292. registerarea:=0;
  3293. if regs<>[] then
  3294. begin
  3295. for r:=RS_R0 to RS_R15 do
  3296. if r in regs then
  3297. inc(registerarea,4);
  3298. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,regs));
  3299. end;
  3300. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3301. if stack_parameters or (LocalSize<>0) or
  3302. ((stackmisalignment<>0) and
  3303. ((pi_do_call in current_procinfo.flags) or
  3304. (po_assembler in current_procinfo.procdef.procoptions))) then
  3305. begin
  3306. { do we access stack parameters?
  3307. if yes, the previously estimated stacksize must be used }
  3308. if stack_parameters then
  3309. begin
  3310. if localsize>tcpuprocinfo(current_procinfo).stackframesize then
  3311. begin
  3312. writeln(localsize);
  3313. writeln(tcpuprocinfo(current_procinfo).stackframesize);
  3314. internalerror(2013040601);
  3315. end
  3316. else
  3317. localsize:=tcpuprocinfo(current_procinfo).stackframesize-registerarea;
  3318. end
  3319. else
  3320. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3321. if localsize<508 then
  3322. begin
  3323. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  3324. end
  3325. else if localsize<=1016 then
  3326. begin
  3327. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3328. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize-508));
  3329. end
  3330. else
  3331. begin
  3332. a_load_const_reg(list,OS_ADDR,-localsize,NR_R4);
  3333. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R4));
  3334. include(regs,RS_R4);
  3335. //!!!! if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  3336. //!!!! a_reg_alloc(list,NR_R12);
  3337. //!!!! a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  3338. //!!!! list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  3339. //!!!! a_reg_dealloc(list,NR_R12);
  3340. end;
  3341. end;
  3342. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3343. begin
  3344. list.concat(taicpu.op_reg_reg_const(A_ADD,current_procinfo.framepointer,NR_STACK_POINTER_REG,0));
  3345. end;
  3346. end;
  3347. end;
  3348. procedure tthumbcgarm.g_proc_exit(list: TAsmList; parasize: longint; nostackframe: boolean);
  3349. var
  3350. LocalSize : longint;
  3351. r: byte;
  3352. regs : tcpuregisterset;
  3353. registerarea : DWord;
  3354. stackmisalignment: pint;
  3355. stack_parameters : Boolean;
  3356. begin
  3357. if not(nostackframe) then
  3358. begin
  3359. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3360. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3361. include(regs,RS_R15);
  3362. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3363. include(regs,getsupreg(current_procinfo.framepointer));
  3364. registerarea:=0;
  3365. for r:=RS_R0 to RS_R15 do
  3366. if r in regs then
  3367. inc(registerarea,4);
  3368. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3369. LocalSize:=current_procinfo.calc_stackframe_size;
  3370. if stack_parameters then
  3371. localsize:=tcpuprocinfo(current_procinfo).stackframesize-registerarea
  3372. else
  3373. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3374. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  3375. (target_info.system in systems_darwin) then
  3376. begin
  3377. if (LocalSize<>0) or
  3378. ((stackmisalignment<>0) and
  3379. ((pi_do_call in current_procinfo.flags) or
  3380. (po_assembler in current_procinfo.procdef.procoptions))) then
  3381. begin
  3382. if LocalSize=0 then
  3383. else if LocalSize<=508 then
  3384. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  3385. else if LocalSize<=1016 then
  3386. begin
  3387. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3388. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,localsize-508));
  3389. end
  3390. else
  3391. begin
  3392. a_reg_alloc(list,NR_R3);
  3393. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R3);
  3394. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R3));
  3395. a_reg_dealloc(list,NR_R3);
  3396. end;
  3397. end;
  3398. if regs=[] then
  3399. begin
  3400. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3401. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3402. else
  3403. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3404. end
  3405. else
  3406. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,regs));
  3407. end;
  3408. end
  3409. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3410. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3411. else
  3412. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3413. end;
  3414. procedure tthumbcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3415. var
  3416. oppostfix:toppostfix;
  3417. usedtmpref: treference;
  3418. tmpreg,tmpreg2 : tregister;
  3419. dir : integer;
  3420. begin
  3421. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3422. FromSize := ToSize;
  3423. case FromSize of
  3424. { signed integer registers }
  3425. OS_8:
  3426. oppostfix:=PF_B;
  3427. OS_S8:
  3428. oppostfix:=PF_SB;
  3429. OS_16:
  3430. oppostfix:=PF_H;
  3431. OS_S16:
  3432. oppostfix:=PF_SH;
  3433. OS_32,
  3434. OS_S32:
  3435. oppostfix:=PF_None;
  3436. else
  3437. InternalError(200308298);
  3438. end;
  3439. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3440. begin
  3441. if target_info.endian=endian_big then
  3442. dir:=-1
  3443. else
  3444. dir:=1;
  3445. case FromSize of
  3446. OS_16,OS_S16:
  3447. begin
  3448. { only complicated references need an extra loadaddr }
  3449. if assigned(ref.symbol) or
  3450. (ref.index<>NR_NO) or
  3451. (ref.offset<-124) or
  3452. (ref.offset>124) or
  3453. { sometimes the compiler reused registers }
  3454. (reg=ref.index) or
  3455. (reg=ref.base) then
  3456. begin
  3457. tmpreg2:=getintregister(list,OS_INT);
  3458. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3459. reference_reset_base(usedtmpref,tmpreg2,0,ref.temppos,ref.alignment,ref.volatility);
  3460. end
  3461. else
  3462. usedtmpref:=ref;
  3463. if target_info.endian=endian_big then
  3464. inc(usedtmpref.offset,1);
  3465. tmpreg:=getintregister(list,OS_INT);
  3466. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3467. inc(usedtmpref.offset,dir);
  3468. if FromSize=OS_16 then
  3469. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3470. else
  3471. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3472. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3473. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3474. end;
  3475. OS_32,OS_S32:
  3476. begin
  3477. tmpreg:=getintregister(list,OS_INT);
  3478. { only complicated references need an extra loadaddr }
  3479. if assigned(ref.symbol) or
  3480. (ref.index<>NR_NO) or
  3481. (ref.offset<-124) or
  3482. (ref.offset>124) or
  3483. { sometimes the compiler reused registers }
  3484. (reg=ref.index) or
  3485. (reg=ref.base) then
  3486. begin
  3487. tmpreg2:=getintregister(list,OS_INT);
  3488. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3489. reference_reset_base(usedtmpref,tmpreg2,0,ref.temppos,ref.alignment,ref.volatility);
  3490. end
  3491. else
  3492. usedtmpref:=ref;
  3493. if ref.alignment=2 then
  3494. begin
  3495. if target_info.endian=endian_big then
  3496. inc(usedtmpref.offset,2);
  3497. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  3498. inc(usedtmpref.offset,dir*2);
  3499. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  3500. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3501. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3502. end
  3503. else
  3504. begin
  3505. if target_info.endian=endian_big then
  3506. inc(usedtmpref.offset,3);
  3507. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3508. inc(usedtmpref.offset,dir);
  3509. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3510. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3511. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3512. inc(usedtmpref.offset,dir);
  3513. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3514. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3515. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3516. inc(usedtmpref.offset,dir);
  3517. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3518. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,24));
  3519. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3520. end;
  3521. end
  3522. else
  3523. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3524. end;
  3525. end
  3526. else
  3527. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3528. if (fromsize=OS_S8) and (tosize = OS_16) then
  3529. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  3530. end;
  3531. procedure tthumbcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3532. var
  3533. l : tasmlabel;
  3534. hr : treference;
  3535. begin
  3536. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3537. internalerror(2002090902);
  3538. if is_thumb_imm(a) then
  3539. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3540. else
  3541. begin
  3542. reference_reset(hr,4,[]);
  3543. current_asmdata.getjumplabel(l);
  3544. cg.a_label(current_procinfo.aktlocaldata,l);
  3545. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3546. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3547. hr.symbol:=l;
  3548. hr.base:=NR_PC;
  3549. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3550. end;
  3551. end;
  3552. procedure tthumbcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  3553. var
  3554. hsym : tsym;
  3555. href,
  3556. tmpref : treference;
  3557. paraloc : Pcgparalocation;
  3558. l : TAsmLabel;
  3559. begin
  3560. { calculate the parameter info for the procdef }
  3561. procdef.init_paraloc_info(callerside);
  3562. hsym:=tsym(procdef.parast.Find('self'));
  3563. if not(assigned(hsym) and
  3564. (hsym.typ=paravarsym)) then
  3565. internalerror(200305251);
  3566. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  3567. while paraloc<>nil do
  3568. with paraloc^ do
  3569. begin
  3570. case loc of
  3571. LOC_REGISTER:
  3572. begin
  3573. if is_thumb_imm(ioffset) then
  3574. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  3575. else
  3576. begin
  3577. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3578. reference_reset(tmpref,4,[]);
  3579. current_asmdata.getjumplabel(l);
  3580. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3581. cg.a_label(current_procinfo.aktlocaldata,l);
  3582. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3583. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3584. tmpref.symbol:=l;
  3585. tmpref.base:=NR_PC;
  3586. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3587. a_op_reg_reg(list,OP_SUB,size,NR_R4,register);
  3588. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3589. end;
  3590. end;
  3591. LOC_REFERENCE:
  3592. begin
  3593. { offset in the wrapper needs to be adjusted for the stored
  3594. return address }
  3595. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),ctempposinvalid,sizeof(pint),[]);
  3596. if is_thumb_imm(ioffset) then
  3597. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  3598. else
  3599. begin
  3600. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3601. reference_reset(tmpref,4,[]);
  3602. current_asmdata.getjumplabel(l);
  3603. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3604. cg.a_label(current_procinfo.aktlocaldata,l);
  3605. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3606. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3607. tmpref.symbol:=l;
  3608. tmpref.base:=NR_PC;
  3609. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3610. a_op_reg_ref(list,OP_SUB,size,NR_R4,href);
  3611. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3612. end;
  3613. end
  3614. else
  3615. internalerror(200309189);
  3616. end;
  3617. paraloc:=next;
  3618. end;
  3619. end;
  3620. function tthumbcgarm.handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference;
  3621. var
  3622. href : treference;
  3623. tmpreg : TRegister;
  3624. begin
  3625. href:=ref;
  3626. if { LDR/STR limitations }
  3627. (
  3628. (((op=A_LDR) and (oppostfix=PF_None)) or
  3629. ((op=A_STR) and (oppostfix=PF_None))) and
  3630. (ref.base<>NR_STACK_POINTER_REG) and
  3631. (abs(ref.offset)>124)
  3632. ) or
  3633. { LDRB/STRB limitations }
  3634. (
  3635. (((op=A_LDR) and (oppostfix=PF_B)) or
  3636. ((op=A_LDRB) and (oppostfix=PF_None)) or
  3637. ((op=A_STR) and (oppostfix=PF_B)) or
  3638. ((op=A_STRB) and (oppostfix=PF_None))) and
  3639. ((ref.base=NR_STACK_POINTER_REG) or
  3640. (ref.index=NR_STACK_POINTER_REG) or
  3641. (abs(ref.offset)>31)
  3642. )
  3643. ) or
  3644. { LDRH/STRH limitations }
  3645. (
  3646. (((op=A_LDR) and (oppostfix=PF_H)) or
  3647. ((op=A_LDRH) and (oppostfix=PF_None)) or
  3648. ((op=A_STR) and (oppostfix=PF_H)) or
  3649. ((op=A_STRH) and (oppostfix=PF_None))) and
  3650. ((ref.base=NR_STACK_POINTER_REG) or
  3651. (ref.index=NR_STACK_POINTER_REG) or
  3652. (abs(ref.offset)>62) or
  3653. ((abs(ref.offset) mod 2)<>0)
  3654. )
  3655. ) then
  3656. begin
  3657. tmpreg:=getintregister(list,OS_ADDR);
  3658. a_loadaddr_ref_reg(list,ref,tmpreg);
  3659. reference_reset_base(href,tmpreg,0,ref.temppos,ref.alignment,ref.volatility);
  3660. end
  3661. else if (op=A_LDR) and
  3662. (oppostfix in [PF_None]) and
  3663. (ref.base=NR_STACK_POINTER_REG) and
  3664. (abs(ref.offset)>1020) then
  3665. begin
  3666. tmpreg:=getintregister(list,OS_ADDR);
  3667. a_loadaddr_ref_reg(list,ref,tmpreg);
  3668. reference_reset_base(href,tmpreg,0,ref.temppos,ref.alignment,ref.volatility);
  3669. end
  3670. else if (op=A_LDR) and
  3671. ((oppostfix in [PF_SH,PF_SB]) or
  3672. (abs(ref.offset)>124)) then
  3673. begin
  3674. tmpreg:=getintregister(list,OS_ADDR);
  3675. a_loadaddr_ref_reg(list,ref,tmpreg);
  3676. reference_reset_base(href,tmpreg,0,ref.temppos,ref.alignment,ref.volatility);
  3677. end;
  3678. Result:=inherited handle_load_store(list, op, oppostfix, reg, href);
  3679. end;
  3680. procedure tthumbcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  3681. var
  3682. tmpreg : tregister;
  3683. begin
  3684. case op of
  3685. OP_NEG:
  3686. list.concat(taicpu.op_reg_reg(A_NEG,dst,src));
  3687. OP_NOT:
  3688. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  3689. OP_DIV,OP_IDIV:
  3690. internalerror(200308284);
  3691. OP_ROL:
  3692. begin
  3693. if not(size in [OS_32,OS_S32]) then
  3694. internalerror(2008072801);
  3695. { simulate ROL by ror'ing 32-value }
  3696. tmpreg:=getintregister(list,OS_32);
  3697. a_load_const_reg(list,OS_32,32,tmpreg);
  3698. list.concat(taicpu.op_reg_reg(A_SUB,tmpreg,src));
  3699. list.concat(taicpu.op_reg_reg(A_ROR,dst,src));
  3700. end;
  3701. else
  3702. begin
  3703. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3704. list.concat(setoppostfix(
  3705. taicpu.op_reg_reg(op_reg_opcg2asmop[op],dst,src),op_reg_postfix[op]));
  3706. end;
  3707. end;
  3708. maybeadjustresult(list,op,size,dst);
  3709. end;
  3710. procedure tthumbcgarm.a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);
  3711. var
  3712. tmpreg : tregister;
  3713. {$ifdef DUMMY}
  3714. l1 : longint;
  3715. {$endif DUMMY}
  3716. begin
  3717. //!!! ovloc.loc:=LOC_VOID;
  3718. if {$ifopt R+}(a<>-2147483648) and{$endif} {!!!!!! not setflags and } is_thumb_imm(-a) then
  3719. case op of
  3720. OP_ADD:
  3721. begin
  3722. op:=OP_SUB;
  3723. a:=aint(dword(-a));
  3724. end;
  3725. OP_SUB:
  3726. begin
  3727. op:=OP_ADD;
  3728. a:=aint(dword(-a));
  3729. end
  3730. end;
  3731. if is_thumb_imm(a) and (op in [OP_ADD,OP_SUB]) then
  3732. begin
  3733. // if cgsetflags or setflags then
  3734. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3735. list.concat(setoppostfix(
  3736. taicpu.op_reg_const(op_reg_opcg2asmop[op],dst,a),op_reg_postfix[op]));
  3737. if (cgsetflags {!!! or setflags }) and (size in [OS_8,OS_16,OS_32]) then
  3738. begin
  3739. //!!! ovloc.loc:=LOC_FLAGS;
  3740. case op of
  3741. OP_ADD:
  3742. //!!! ovloc.resflags:=F_CS;
  3743. ;
  3744. OP_SUB:
  3745. //!!! ovloc.resflags:=F_CC;
  3746. ;
  3747. end;
  3748. end;
  3749. end
  3750. else
  3751. begin
  3752. { there could be added some more sophisticated optimizations }
  3753. if (op in [OP_MUL,OP_IMUL,OP_DIV,OP_IDIV]) and (a=1) then
  3754. a_load_reg_reg(list,size,size,dst,dst)
  3755. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  3756. a_load_const_reg(list,size,0,dst)
  3757. else if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  3758. a_op_reg_reg(list,OP_NEG,size,dst,dst)
  3759. { we do this here instead in the peephole optimizer because
  3760. it saves us a register }
  3761. {$ifdef DUMMY}
  3762. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  3763. a_op_const_reg_reg(list,OP_SHL,size,l1,dst,dst)
  3764. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  3765. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  3766. begin
  3767. if l1>32 then{roozbeh does this ever happen?}
  3768. internalerror(200308296);
  3769. shifterop_reset(so);
  3770. so.shiftmode:=SM_LSL;
  3771. so.shiftimm:=l1;
  3772. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,dst,so));
  3773. end
  3774. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  3775. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  3776. begin
  3777. if l1>32 then{does this ever happen?}
  3778. internalerror(201205181);
  3779. shifterop_reset(so);
  3780. so.shiftmode:=SM_LSL;
  3781. so.shiftimm:=l1;
  3782. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,dst,dst,so));
  3783. end
  3784. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,dst,dst) then
  3785. begin
  3786. { nothing to do on success }
  3787. end
  3788. {$endif DUMMY}
  3789. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  3790. Just using mov x, #0 might allow some easier optimizations down the line. }
  3791. else if (op = OP_AND) and (dword(a)=0) then
  3792. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  3793. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  3794. else if (op = OP_AND) and (not(dword(a))=0) then
  3795. // do nothing
  3796. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  3797. broader range of shifterconstants.}
  3798. {$ifdef DUMMY}
  3799. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  3800. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,not(dword(a))))
  3801. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  3802. begin
  3803. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm1));
  3804. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  3805. end
  3806. else if (op in [OP_ADD, OP_SUB, OP_OR]) and
  3807. not(cgsetflags or setflags) and
  3808. split_into_shifter_const(a, imm1, imm2) then
  3809. begin
  3810. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm1));
  3811. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  3812. end
  3813. {$endif DUMMY}
  3814. else if (op in [OP_SHL, OP_SHR, OP_SAR]) then
  3815. begin
  3816. list.concat(taicpu.op_reg_reg_const(op_reg_opcg2asmop[op],dst,dst,a));
  3817. end
  3818. else
  3819. begin
  3820. tmpreg:=getintregister(list,size);
  3821. a_load_const_reg(list,size,a,tmpreg);
  3822. a_op_reg_reg(list,op,size,tmpreg,dst);
  3823. end;
  3824. end;
  3825. maybeadjustresult(list,op,size,dst);
  3826. end;
  3827. procedure tthumbcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister);
  3828. begin
  3829. if (op=OP_ADD) and (src=NR_R13) and (dst<>NR_R13) and ((a mod 4)=0) and (a>0) and (a<=1020) then
  3830. list.concat(taicpu.op_reg_reg_const(A_ADD,dst,src,a))
  3831. else
  3832. inherited a_op_const_reg_reg(list,op,size,a,src,dst);
  3833. end;
  3834. procedure tthumbcgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  3835. var
  3836. l1,l2 : tasmlabel;
  3837. ai : taicpu;
  3838. begin
  3839. current_asmdata.getjumplabel(l1);
  3840. current_asmdata.getjumplabel(l2);
  3841. ai:=setcondition(taicpu.op_sym(A_B,l1),flags_to_cond(f));
  3842. ai.is_jmp:=true;
  3843. list.concat(ai);
  3844. list.concat(taicpu.op_reg_const(A_MOV,reg,0));
  3845. list.concat(taicpu.op_sym(A_B,l2));
  3846. cg.a_label(list,l1);
  3847. list.concat(taicpu.op_reg_const(A_MOV,reg,1));
  3848. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3849. cg.a_label(list,l2);
  3850. end;
  3851. procedure tthumb2cgarm.init_register_allocators;
  3852. begin
  3853. inherited init_register_allocators;
  3854. { currently, we save R14 always, so we can use it }
  3855. if (target_info.system<>system_arm_darwin) then
  3856. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3857. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3858. RS_R9,RS_R10,RS_R12,RS_R14],first_int_imreg,[])
  3859. else
  3860. { r9 is not available on Darwin according to the llvm code generator }
  3861. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3862. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3863. RS_R10,RS_R12,RS_R14],first_int_imreg,[]);
  3864. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  3865. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  3866. if current_settings.fputype in [fpu_vfpv3,fpu_vfpv4] then
  3867. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3868. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3869. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  3870. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3871. ],first_mm_imreg,[])
  3872. else if current_settings.fputype in [fpu_fpv4_s16,fpu_vfpv3_d16] then
  3873. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3874. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3875. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3876. ],first_mm_imreg,[])
  3877. else
  3878. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBNONE,
  3879. [RS_S0,RS_S1,RS_R2,RS_R3,RS_R4,RS_S31],first_mm_imreg,[]);
  3880. end;
  3881. procedure tthumb2cgarm.done_register_allocators;
  3882. begin
  3883. rg[R_INTREGISTER].free;
  3884. rg[R_FPUREGISTER].free;
  3885. rg[R_MMREGISTER].free;
  3886. inherited done_register_allocators;
  3887. end;
  3888. procedure tthumb2cgarm.a_call_reg(list : TAsmList;reg: tregister);
  3889. begin
  3890. list.concat(taicpu.op_reg(A_BLX, reg));
  3891. {
  3892. the compiler does not properly set this flag anymore in pass 1, and
  3893. for now we only need it after pass 2 (I hope) (JM)
  3894. if not(pi_do_call in current_procinfo.flags) then
  3895. internalerror(2003060703);
  3896. }
  3897. include(current_procinfo.flags,pi_do_call);
  3898. end;
  3899. procedure tthumb2cgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3900. var
  3901. l : tasmlabel;
  3902. hr : treference;
  3903. begin
  3904. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3905. internalerror(2002090902);
  3906. if is_thumb32_imm(a) then
  3907. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3908. else if is_thumb32_imm(not(a)) then
  3909. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  3910. else if (a and $FFFF)=a then
  3911. list.concat(taicpu.op_reg_const(A_MOVW,reg,a))
  3912. else
  3913. begin
  3914. reference_reset(hr,4,[]);
  3915. current_asmdata.getjumplabel(l);
  3916. cg.a_label(current_procinfo.aktlocaldata,l);
  3917. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3918. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3919. hr.symbol:=l;
  3920. hr.base:=NR_PC;
  3921. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3922. end;
  3923. end;
  3924. procedure tthumb2cgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3925. var
  3926. oppostfix:toppostfix;
  3927. usedtmpref: treference;
  3928. tmpreg,tmpreg2 : tregister;
  3929. so : tshifterop;
  3930. dir : integer;
  3931. begin
  3932. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3933. FromSize := ToSize;
  3934. case FromSize of
  3935. { signed integer registers }
  3936. OS_8:
  3937. oppostfix:=PF_B;
  3938. OS_S8:
  3939. oppostfix:=PF_SB;
  3940. OS_16:
  3941. oppostfix:=PF_H;
  3942. OS_S16:
  3943. oppostfix:=PF_SH;
  3944. OS_32,
  3945. OS_S32:
  3946. oppostfix:=PF_None;
  3947. else
  3948. InternalError(200308299);
  3949. end;
  3950. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3951. begin
  3952. if target_info.endian=endian_big then
  3953. dir:=-1
  3954. else
  3955. dir:=1;
  3956. case FromSize of
  3957. OS_16,OS_S16:
  3958. begin
  3959. { only complicated references need an extra loadaddr }
  3960. if assigned(ref.symbol) or
  3961. (ref.index<>NR_NO) or
  3962. (ref.offset<-255) or
  3963. (ref.offset>4094) or
  3964. { sometimes the compiler reused registers }
  3965. (reg=ref.index) or
  3966. (reg=ref.base) then
  3967. begin
  3968. tmpreg2:=getintregister(list,OS_INT);
  3969. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3970. reference_reset_base(usedtmpref,tmpreg2,0,ref.temppos,ref.alignment,ref.volatility);
  3971. end
  3972. else
  3973. usedtmpref:=ref;
  3974. if target_info.endian=endian_big then
  3975. inc(usedtmpref.offset,1);
  3976. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  3977. tmpreg:=getintregister(list,OS_INT);
  3978. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3979. inc(usedtmpref.offset,dir);
  3980. if FromSize=OS_16 then
  3981. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3982. else
  3983. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3984. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  3985. end;
  3986. OS_32,OS_S32:
  3987. begin
  3988. tmpreg:=getintregister(list,OS_INT);
  3989. { only complicated references need an extra loadaddr }
  3990. if assigned(ref.symbol) or
  3991. (ref.index<>NR_NO) or
  3992. (ref.offset<-255) or
  3993. (ref.offset>4092) or
  3994. { sometimes the compiler reused registers }
  3995. (reg=ref.index) or
  3996. (reg=ref.base) then
  3997. begin
  3998. tmpreg2:=getintregister(list,OS_INT);
  3999. a_loadaddr_ref_reg(list,ref,tmpreg2);
  4000. reference_reset_base(usedtmpref,tmpreg2,0,ref.temppos,ref.alignment,ref.volatility);
  4001. end
  4002. else
  4003. usedtmpref:=ref;
  4004. shifterop_reset(so);so.shiftmode:=SM_LSL;
  4005. if ref.alignment=2 then
  4006. begin
  4007. if target_info.endian=endian_big then
  4008. inc(usedtmpref.offset,2);
  4009. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  4010. inc(usedtmpref.offset,dir*2);
  4011. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  4012. so.shiftimm:=16;
  4013. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4014. end
  4015. else
  4016. begin
  4017. if target_info.endian=endian_big then
  4018. inc(usedtmpref.offset,3);
  4019. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  4020. inc(usedtmpref.offset,dir);
  4021. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4022. so.shiftimm:=8;
  4023. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4024. inc(usedtmpref.offset,dir);
  4025. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4026. so.shiftimm:=16;
  4027. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4028. inc(usedtmpref.offset,dir);
  4029. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4030. so.shiftimm:=24;
  4031. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4032. end;
  4033. end
  4034. else
  4035. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4036. end;
  4037. end
  4038. else
  4039. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4040. if (fromsize=OS_S8) and (tosize = OS_16) then
  4041. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  4042. end;
  4043. procedure tthumb2cgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  4044. begin
  4045. if op = OP_NOT then
  4046. begin
  4047. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  4048. case size of
  4049. OS_8: list.concat(taicpu.op_reg_reg(A_UXTB,dst,dst));
  4050. OS_S8: list.concat(taicpu.op_reg_reg(A_SXTB,dst,dst));
  4051. OS_16: list.concat(taicpu.op_reg_reg(A_UXTH,dst,dst));
  4052. OS_S16: list.concat(taicpu.op_reg_reg(A_SXTH,dst,dst));
  4053. end;
  4054. end
  4055. else
  4056. inherited a_op_reg_reg(list, op, size, src, dst);
  4057. end;
  4058. procedure tthumb2cgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4059. var
  4060. shift, width : byte;
  4061. tmpreg : tregister;
  4062. so : tshifterop;
  4063. l1 : longint;
  4064. begin
  4065. ovloc.loc:=LOC_VOID;
  4066. if {$ifopt R+}(a<>-2147483648) and{$endif} is_shifter_const(-a,shift) then
  4067. case op of
  4068. OP_ADD:
  4069. begin
  4070. op:=OP_SUB;
  4071. a:=aint(dword(-a));
  4072. end;
  4073. OP_SUB:
  4074. begin
  4075. op:=OP_ADD;
  4076. a:=aint(dword(-a));
  4077. end
  4078. end;
  4079. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  4080. case op of
  4081. OP_NEG,OP_NOT,
  4082. OP_DIV,OP_IDIV:
  4083. internalerror(200308285);
  4084. OP_SHL:
  4085. begin
  4086. if a>32 then
  4087. internalerror(2014020703);
  4088. if a<>0 then
  4089. begin
  4090. shifterop_reset(so);
  4091. so.shiftmode:=SM_LSL;
  4092. so.shiftimm:=a;
  4093. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4094. end
  4095. else
  4096. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4097. end;
  4098. OP_ROL:
  4099. begin
  4100. if a>32 then
  4101. internalerror(2014020704);
  4102. if a<>0 then
  4103. begin
  4104. shifterop_reset(so);
  4105. so.shiftmode:=SM_ROR;
  4106. so.shiftimm:=32-a;
  4107. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4108. end
  4109. else
  4110. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4111. end;
  4112. OP_ROR:
  4113. begin
  4114. if a>32 then
  4115. internalerror(2014020705);
  4116. if a<>0 then
  4117. begin
  4118. shifterop_reset(so);
  4119. so.shiftmode:=SM_ROR;
  4120. so.shiftimm:=a;
  4121. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4122. end
  4123. else
  4124. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4125. end;
  4126. OP_SHR:
  4127. begin
  4128. if a>32 then
  4129. internalerror(200308292);
  4130. shifterop_reset(so);
  4131. if a<>0 then
  4132. begin
  4133. so.shiftmode:=SM_LSR;
  4134. so.shiftimm:=a;
  4135. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4136. end
  4137. else
  4138. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4139. end;
  4140. OP_SAR:
  4141. begin
  4142. if a>32 then
  4143. internalerror(200308295);
  4144. if a<>0 then
  4145. begin
  4146. shifterop_reset(so);
  4147. so.shiftmode:=SM_ASR;
  4148. so.shiftimm:=a;
  4149. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4150. end
  4151. else
  4152. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4153. end;
  4154. else
  4155. if (op in [OP_SUB, OP_ADD]) and
  4156. ((a < 0) or
  4157. (a > 4095)) then
  4158. begin
  4159. tmpreg:=getintregister(list,size);
  4160. a_load_const_reg(list, size, a, tmpreg);
  4161. if cgsetflags or setflags then
  4162. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4163. list.concat(setoppostfix(
  4164. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4165. end
  4166. else
  4167. begin
  4168. if cgsetflags or setflags then
  4169. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4170. list.concat(setoppostfix(
  4171. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4172. end;
  4173. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  4174. begin
  4175. ovloc.loc:=LOC_FLAGS;
  4176. case op of
  4177. OP_ADD:
  4178. ovloc.resflags:=F_CS;
  4179. OP_SUB:
  4180. ovloc.resflags:=F_CC;
  4181. end;
  4182. end;
  4183. end
  4184. else
  4185. begin
  4186. { there could be added some more sophisticated optimizations }
  4187. if (op in [OP_MUL,OP_IMUL]) and (a=1) then
  4188. a_load_reg_reg(list,size,size,src,dst)
  4189. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  4190. a_load_const_reg(list,size,0,dst)
  4191. else if (op in [OP_IMUL]) and (a=-1) then
  4192. a_op_reg_reg(list,OP_NEG,size,src,dst)
  4193. { we do this here instead in the peephole optimizer because
  4194. it saves us a register }
  4195. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  4196. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  4197. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  4198. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  4199. begin
  4200. if l1>32 then{roozbeh does this ever happen?}
  4201. internalerror(200308296);
  4202. shifterop_reset(so);
  4203. so.shiftmode:=SM_LSL;
  4204. so.shiftimm:=l1;
  4205. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  4206. end
  4207. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  4208. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  4209. begin
  4210. if l1>32 then{does this ever happen?}
  4211. internalerror(201205181);
  4212. shifterop_reset(so);
  4213. so.shiftmode:=SM_LSL;
  4214. so.shiftimm:=l1;
  4215. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  4216. end
  4217. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  4218. begin
  4219. { nothing to do on success }
  4220. end
  4221. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  4222. Just using mov x, #0 might allow some easier optimizations down the line. }
  4223. else if (op = OP_AND) and (dword(a)=0) then
  4224. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  4225. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  4226. else if (op = OP_AND) and (not(dword(a))=0) then
  4227. list.concat(taicpu.op_reg_reg(A_MOV,dst,src))
  4228. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  4229. broader range of shifterconstants.}
  4230. {else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  4231. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))}
  4232. else if (op = OP_AND) and is_thumb32_imm(a) then
  4233. list.concat(taicpu.op_reg_reg_const(A_AND,dst,src,dword(a)))
  4234. else if (op = OP_AND) and (a = $FFFF) then
  4235. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  4236. else if (op = OP_AND) and is_thumb32_imm(not(dword(a))) then
  4237. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  4238. else if (op = OP_AND) and is_continuous_mask(aword(not(a)), shift, width) then
  4239. begin
  4240. a_load_reg_reg(list,size,size,src,dst);
  4241. list.concat(taicpu.op_reg_const_const(A_BFC,dst,shift,width))
  4242. end
  4243. else
  4244. begin
  4245. tmpreg:=getintregister(list,size);
  4246. a_load_const_reg(list,size,a,tmpreg);
  4247. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  4248. end;
  4249. end;
  4250. maybeadjustresult(list,op,size,dst);
  4251. end;
  4252. const
  4253. op_reg_reg_opcg2asmopThumb2: array[TOpCG] of tasmop =
  4254. (A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NONE,A_MVN,A_ORR,
  4255. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  4256. procedure tthumb2cgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4257. var
  4258. so : tshifterop;
  4259. tmpreg,overflowreg : tregister;
  4260. asmop : tasmop;
  4261. begin
  4262. ovloc.loc:=LOC_VOID;
  4263. case op of
  4264. OP_NEG,OP_NOT:
  4265. internalerror(200308286);
  4266. OP_ROL:
  4267. begin
  4268. if not(size in [OS_32,OS_S32]) then
  4269. internalerror(2008072801);
  4270. { simulate ROL by ror'ing 32-value }
  4271. tmpreg:=getintregister(list,OS_32);
  4272. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,32));
  4273. list.concat(taicpu.op_reg_reg_reg(A_SUB,src1,tmpreg,src1));
  4274. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4275. end;
  4276. OP_ROR:
  4277. begin
  4278. if not(size in [OS_32,OS_S32]) then
  4279. internalerror(2008072802);
  4280. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4281. end;
  4282. OP_IMUL,
  4283. OP_MUL:
  4284. begin
  4285. if cgsetflags or setflags then
  4286. begin
  4287. overflowreg:=getintregister(list,size);
  4288. if op=OP_IMUL then
  4289. asmop:=A_SMULL
  4290. else
  4291. asmop:=A_UMULL;
  4292. { the arm doesn't allow that rd and rm are the same }
  4293. if dst=src2 then
  4294. begin
  4295. if dst<>src1 then
  4296. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  4297. else
  4298. begin
  4299. tmpreg:=getintregister(list,size);
  4300. a_load_reg_reg(list,size,size,src2,dst);
  4301. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  4302. end;
  4303. end
  4304. else
  4305. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  4306. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4307. if op=OP_IMUL then
  4308. begin
  4309. shifterop_reset(so);
  4310. so.shiftmode:=SM_ASR;
  4311. so.shiftimm:=31;
  4312. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  4313. end
  4314. else
  4315. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  4316. ovloc.loc:=LOC_FLAGS;
  4317. ovloc.resflags:=F_NE;
  4318. end
  4319. else
  4320. begin
  4321. { the arm doesn't allow that rd and rm are the same }
  4322. if dst=src2 then
  4323. begin
  4324. if dst<>src1 then
  4325. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  4326. else
  4327. begin
  4328. tmpreg:=getintregister(list,size);
  4329. a_load_reg_reg(list,size,size,src2,dst);
  4330. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  4331. end;
  4332. end
  4333. else
  4334. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  4335. end;
  4336. end;
  4337. else
  4338. begin
  4339. if cgsetflags or setflags then
  4340. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4341. {$ifdef dummy}
  4342. { R13 is not allowed for certain instruction operands }
  4343. if op_reg_reg_opcg2asmopThumb2[op] in [A_ADD,A_SUB,A_AND,A_BIC,A_EOR] then
  4344. begin
  4345. if getsupreg(dst)=RS_R13 then
  4346. begin
  4347. tmpreg:=getintregister(list,OS_INT);
  4348. a_load_reg_reg(list,OS_INT,OS_INT,dst,tmpreg);
  4349. dst:=tmpreg;
  4350. end;
  4351. if getsupreg(src1)=RS_R13 then
  4352. begin
  4353. tmpreg:=getintregister(list,OS_INT);
  4354. a_load_reg_reg(list,OS_INT,OS_INT,src1,tmpreg);
  4355. src1:=tmpreg;
  4356. end;
  4357. end;
  4358. {$endif}
  4359. list.concat(setoppostfix(
  4360. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmopThumb2[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4361. end;
  4362. end;
  4363. maybeadjustresult(list,op,size,dst);
  4364. end;
  4365. procedure tthumb2cgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  4366. begin
  4367. list.concat(taicpu.op_cond(A_ITE, flags_to_cond(f)));
  4368. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  4369. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  4370. end;
  4371. procedure tthumb2cgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  4372. var
  4373. ref : treference;
  4374. shift : byte;
  4375. firstfloatreg,lastfloatreg,
  4376. r : byte;
  4377. regs : tcpuregisterset;
  4378. stackmisalignment: pint;
  4379. begin
  4380. LocalSize:=align(LocalSize,4);
  4381. { call instruction does not put anything on the stack }
  4382. stackmisalignment:=0;
  4383. if not(nostackframe) then
  4384. begin
  4385. firstfloatreg:=RS_NO;
  4386. lastfloatreg:=RS_NO;
  4387. { save floating point registers? }
  4388. for r:=RS_F0 to RS_F7 do
  4389. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4390. begin
  4391. if firstfloatreg=RS_NO then
  4392. firstfloatreg:=r;
  4393. lastfloatreg:=r;
  4394. inc(stackmisalignment,12);
  4395. end;
  4396. a_reg_alloc(list,NR_STACK_POINTER_REG);
  4397. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4398. begin
  4399. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  4400. a_reg_alloc(list,NR_R12);
  4401. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  4402. end;
  4403. { save int registers }
  4404. reference_reset(ref,4,[]);
  4405. ref.index:=NR_STACK_POINTER_REG;
  4406. ref.addressmode:=AM_PREINDEXED;
  4407. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4408. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4409. regs:=regs+[RS_FRAME_POINTER_REG,RS_R14]
  4410. else if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  4411. include(regs,RS_R14);
  4412. if regs<>[] then
  4413. begin
  4414. for r:=RS_R0 to RS_R15 do
  4415. if (r in regs) then
  4416. inc(stackmisalignment,4);
  4417. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4418. end;
  4419. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4420. begin
  4421. { the framepointer now points to the saved R15, so the saved
  4422. framepointer is at R11-12 (for get_caller_frame) }
  4423. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  4424. a_reg_dealloc(list,NR_R12);
  4425. end;
  4426. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4427. if (LocalSize<>0) or
  4428. ((stackmisalignment<>0) and
  4429. ((pi_do_call in current_procinfo.flags) or
  4430. (po_assembler in current_procinfo.procdef.procoptions))) then
  4431. begin
  4432. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4433. if not(is_shifter_const(localsize,shift)) then
  4434. begin
  4435. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  4436. a_reg_alloc(list,NR_R12);
  4437. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4438. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  4439. a_reg_dealloc(list,NR_R12);
  4440. end
  4441. else
  4442. begin
  4443. a_reg_dealloc(list,NR_R12);
  4444. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  4445. end;
  4446. end;
  4447. if firstfloatreg<>RS_NO then
  4448. begin
  4449. reference_reset(ref,4,[]);
  4450. if tg.direction*tcpuprocinfo(current_procinfo).floatregstart>=1023 then
  4451. begin
  4452. a_load_const_reg(list,OS_ADDR,-tcpuprocinfo(current_procinfo).floatregstart,NR_R12);
  4453. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4454. ref.base:=NR_R12;
  4455. end
  4456. else
  4457. begin
  4458. ref.base:=current_procinfo.framepointer;
  4459. ref.offset:=tcpuprocinfo(current_procinfo).floatregstart;
  4460. end;
  4461. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4462. lastfloatreg-firstfloatreg+1,ref));
  4463. end;
  4464. end;
  4465. end;
  4466. procedure tthumb2cgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  4467. var
  4468. ref : treference;
  4469. firstfloatreg,lastfloatreg,
  4470. r : byte;
  4471. shift : byte;
  4472. regs : tcpuregisterset;
  4473. LocalSize : longint;
  4474. stackmisalignment: pint;
  4475. begin
  4476. if not(nostackframe) then
  4477. begin
  4478. stackmisalignment:=0;
  4479. { restore floating point register }
  4480. firstfloatreg:=RS_NO;
  4481. lastfloatreg:=RS_NO;
  4482. { save floating point registers? }
  4483. for r:=RS_F0 to RS_F7 do
  4484. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4485. begin
  4486. if firstfloatreg=RS_NO then
  4487. firstfloatreg:=r;
  4488. lastfloatreg:=r;
  4489. { floating point register space is already included in
  4490. localsize below by calc_stackframe_size
  4491. inc(stackmisalignment,12);
  4492. }
  4493. end;
  4494. if firstfloatreg<>RS_NO then
  4495. begin
  4496. reference_reset(ref,4,[]);
  4497. if tg.direction*tcpuprocinfo(current_procinfo).floatregstart>=1023 then
  4498. begin
  4499. a_load_const_reg(list,OS_ADDR,-tcpuprocinfo(current_procinfo).floatregstart,NR_R12);
  4500. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4501. ref.base:=NR_R12;
  4502. end
  4503. else
  4504. begin
  4505. ref.base:=current_procinfo.framepointer;
  4506. ref.offset:=tcpuprocinfo(current_procinfo).floatregstart;
  4507. end;
  4508. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4509. lastfloatreg-firstfloatreg+1,ref));
  4510. end;
  4511. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4512. if (pi_do_call in current_procinfo.flags) or (regs<>[]) then
  4513. begin
  4514. exclude(regs,RS_R14);
  4515. include(regs,RS_R15);
  4516. end;
  4517. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  4518. regs:=regs+[RS_FRAME_POINTER_REG,RS_R15];
  4519. for r:=RS_R0 to RS_R15 do
  4520. if (r in regs) then
  4521. inc(stackmisalignment,4);
  4522. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4523. LocalSize:=current_procinfo.calc_stackframe_size;
  4524. if (LocalSize<>0) or
  4525. ((stackmisalignment<>0) and
  4526. ((pi_do_call in current_procinfo.flags) or
  4527. (po_assembler in current_procinfo.procdef.procoptions))) then
  4528. begin
  4529. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4530. if not(is_shifter_const(LocalSize,shift)) then
  4531. begin
  4532. a_reg_alloc(list,NR_R12);
  4533. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4534. list.concat(taicpu.op_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_R12));
  4535. a_reg_dealloc(list,NR_R12);
  4536. end
  4537. else
  4538. begin
  4539. a_reg_dealloc(list,NR_R12);
  4540. list.concat(taicpu.op_reg_const(A_ADD,NR_STACK_POINTER_REG,LocalSize));
  4541. end;
  4542. end;
  4543. if regs=[] then
  4544. list.concat(taicpu.op_reg(A_BX,NR_R14))
  4545. else
  4546. begin
  4547. reference_reset(ref,4,[]);
  4548. ref.index:=NR_STACK_POINTER_REG;
  4549. ref.addressmode:=AM_PREINDEXED;
  4550. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4551. end;
  4552. end
  4553. else
  4554. list.concat(taicpu.op_reg(A_BX,NR_R14));
  4555. end;
  4556. function tthumb2cgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  4557. var
  4558. tmpreg : tregister;
  4559. tmpref : treference;
  4560. l : tasmlabel;
  4561. begin
  4562. tmpreg:=NR_NO;
  4563. { Be sure to have a base register }
  4564. if (ref.base=NR_NO) then
  4565. begin
  4566. if ref.shiftmode<>SM_None then
  4567. internalerror(2014020706);
  4568. ref.base:=ref.index;
  4569. ref.index:=NR_NO;
  4570. end;
  4571. { absolute symbols can't be handled directly, we've to store the symbol reference
  4572. in the text segment and access it pc relative
  4573. For now, we assume that references where base or index equals to PC are already
  4574. relative, all other references are assumed to be absolute and thus they need
  4575. to be handled extra.
  4576. A proper solution would be to change refoptions to a set and store the information
  4577. if the symbol is absolute or relative there.
  4578. }
  4579. if (assigned(ref.symbol) and
  4580. not(is_pc(ref.base)) and
  4581. not(is_pc(ref.index))
  4582. ) or
  4583. { [#xxx] isn't a valid address operand }
  4584. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  4585. //(ref.offset<-4095) or
  4586. (ref.offset<-255) or
  4587. (ref.offset>4095) or
  4588. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  4589. ((ref.offset<-255) or
  4590. (ref.offset>255)
  4591. )
  4592. ) or
  4593. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  4594. ((ref.offset<-1020) or
  4595. (ref.offset>1020) or
  4596. ((abs(ref.offset) mod 4)<>0) or
  4597. { the usual pc relative symbol handling assumes possible offsets of +/- 4095 }
  4598. assigned(ref.symbol)
  4599. )
  4600. ) then
  4601. begin
  4602. reference_reset(tmpref,4,[]);
  4603. { load symbol }
  4604. tmpreg:=getintregister(list,OS_INT);
  4605. if assigned(ref.symbol) then
  4606. begin
  4607. current_asmdata.getjumplabel(l);
  4608. cg.a_label(current_procinfo.aktlocaldata,l);
  4609. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  4610. if ref.refaddr=addr_gottpoff then
  4611. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_gottpoff,ref.symbol,ref.relsymbol,ref.offset))
  4612. else
  4613. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset));
  4614. { load consts entry }
  4615. tmpref.symbol:=l;
  4616. tmpref.base:=NR_R15;
  4617. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  4618. { in case of LDF/STF, we got rid of the NR_R15 }
  4619. if is_pc(ref.base) then
  4620. ref.base:=NR_NO;
  4621. if is_pc(ref.index) then
  4622. ref.index:=NR_NO;
  4623. end
  4624. else
  4625. a_load_const_reg(list,OS_ADDR,ref.offset,tmpreg);
  4626. if (ref.base<>NR_NO) then
  4627. begin
  4628. if ref.index<>NR_NO then
  4629. begin
  4630. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4631. ref.base:=tmpreg;
  4632. end
  4633. else
  4634. begin
  4635. ref.index:=tmpreg;
  4636. ref.shiftimm:=0;
  4637. ref.signindex:=1;
  4638. ref.shiftmode:=SM_None;
  4639. end;
  4640. end
  4641. else
  4642. ref.base:=tmpreg;
  4643. ref.offset:=0;
  4644. ref.symbol:=nil;
  4645. end;
  4646. if (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  4647. begin
  4648. if tmpreg<>NR_NO then
  4649. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg,tmpreg)
  4650. else
  4651. begin
  4652. tmpreg:=getintregister(list,OS_ADDR);
  4653. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg);
  4654. ref.base:=tmpreg;
  4655. end;
  4656. ref.offset:=0;
  4657. end;
  4658. { Hack? Thumb2 doesn't allow PC indexed addressing modes(although it does in the specification) }
  4659. if (ref.base=NR_R15) and (ref.index<>NR_NO) and (ref.shiftmode <> sm_none) then
  4660. begin
  4661. tmpreg:=getintregister(list,OS_ADDR);
  4662. list.concat(taicpu.op_reg_reg(A_MOV, tmpreg, NR_R15));
  4663. ref.base := tmpreg;
  4664. end;
  4665. { floating point operations have only limited references
  4666. we expect here, that a base is already set }
  4667. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  4668. begin
  4669. if ref.shiftmode<>SM_none then
  4670. internalerror(200309121);
  4671. if tmpreg<>NR_NO then
  4672. begin
  4673. if ref.base=tmpreg then
  4674. begin
  4675. if ref.signindex<0 then
  4676. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,tmpreg,ref.index))
  4677. else
  4678. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,tmpreg,ref.index));
  4679. ref.index:=NR_NO;
  4680. end
  4681. else
  4682. begin
  4683. if ref.index<>tmpreg then
  4684. internalerror(200403161);
  4685. if ref.signindex<0 then
  4686. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,ref.base,tmpreg))
  4687. else
  4688. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4689. ref.base:=tmpreg;
  4690. ref.index:=NR_NO;
  4691. end;
  4692. end
  4693. else
  4694. begin
  4695. tmpreg:=getintregister(list,OS_ADDR);
  4696. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,ref.index));
  4697. ref.base:=tmpreg;
  4698. ref.index:=NR_NO;
  4699. end;
  4700. end;
  4701. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  4702. Result := ref;
  4703. end;
  4704. procedure tthumb2cgarm.a_loadmm_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister; shuffle: pmmshuffle);
  4705. var
  4706. instr: taicpu;
  4707. begin
  4708. if (fromsize=OS_F32) and
  4709. (tosize=OS_F32) then
  4710. begin
  4711. instr:=setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32);
  4712. list.Concat(instr);
  4713. add_move_instruction(instr);
  4714. end
  4715. else if (fromsize=OS_F64) and
  4716. (tosize=OS_F64) then
  4717. begin
  4718. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,tregister(longint(reg2)+1),tregister(longint(reg1)+1)), PF_F32));
  4719. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32));
  4720. end
  4721. else if (fromsize=OS_F32) and
  4722. (tosize=OS_F64) then
  4723. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VCVT,reg2,reg1), PF_F32))
  4724. begin
  4725. //list.concat(nil);
  4726. end;
  4727. end;
  4728. procedure tthumb2cgarm.a_loadmm_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  4729. begin
  4730. handle_load_store(list,A_VLDR,PF_None,reg,ref);
  4731. end;
  4732. procedure tthumb2cgarm.a_loadmm_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  4733. begin
  4734. handle_load_store(list,A_VSTR,PF_None,reg,ref);
  4735. end;
  4736. procedure tthumb2cgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize: tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  4737. begin
  4738. if //(shuffle=nil) and
  4739. (tosize=OS_F32) then
  4740. list.Concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg))
  4741. else
  4742. internalerror(2012100813);
  4743. end;
  4744. procedure tthumb2cgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize: tcgsize; mmreg, intreg: tregister; shuffle: pmmshuffle);
  4745. begin
  4746. if //(shuffle=nil) and
  4747. (fromsize=OS_F32) then
  4748. list.Concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg))
  4749. else
  4750. internalerror(2012100814);
  4751. end;
  4752. procedure tthumb2cg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  4753. var tmpreg: tregister;
  4754. begin
  4755. case op of
  4756. OP_NEG:
  4757. begin
  4758. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4759. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  4760. tmpreg:=cg.getintregister(list,OS_32);
  4761. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,0));
  4762. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,tmpreg,regsrc.reghi));
  4763. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4764. end;
  4765. else
  4766. inherited a_op64_reg_reg(list, op, size, regsrc, regdst);
  4767. end;
  4768. end;
  4769. procedure tthumbcg64farm.a_op64_reg_reg(list: TAsmList; op: TOpCG; size: tcgsize; regsrc, regdst: tregister64);
  4770. begin
  4771. case op of
  4772. OP_NEG:
  4773. begin
  4774. list.concat(taicpu.op_reg_const(A_MOV,regdst.reglo,0));
  4775. list.concat(taicpu.op_reg_const(A_MOV,regdst.reghi,0));
  4776. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4777. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4778. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4779. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4780. end;
  4781. OP_NOT:
  4782. begin
  4783. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  4784. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  4785. end;
  4786. OP_AND,OP_OR,OP_XOR:
  4787. begin
  4788. cg.a_op_reg_reg(list,op,OS_32,regsrc.reglo,regdst.reglo);
  4789. cg.a_op_reg_reg(list,op,OS_32,regsrc.reghi,regdst.reghi);
  4790. end;
  4791. OP_ADD:
  4792. begin
  4793. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4794. list.concat(taicpu.op_reg_reg(A_ADD,regdst.reglo,regsrc.reglo));
  4795. list.concat(taicpu.op_reg_reg(A_ADC,regdst.reghi,regsrc.reghi));
  4796. end;
  4797. OP_SUB:
  4798. begin
  4799. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4800. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4801. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4802. end;
  4803. else
  4804. internalerror(2003083101);
  4805. end;
  4806. end;
  4807. procedure tthumbcg64farm.a_op64_const_reg(list: TAsmList; op: TOpCG; size: tcgsize; value: int64; reg: tregister64);
  4808. var
  4809. tmpreg : tregister;
  4810. begin
  4811. case op of
  4812. OP_AND,OP_OR,OP_XOR:
  4813. begin
  4814. cg.a_op_const_reg(list,op,OS_32,aint(lo(value)),reg.reglo);
  4815. cg.a_op_const_reg(list,op,OS_32,aint(hi(value)),reg.reghi);
  4816. end;
  4817. OP_ADD:
  4818. begin
  4819. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4820. begin
  4821. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4822. list.concat(taicpu.op_reg_const(A_ADD,reg.reglo,aint(lo(value))));
  4823. end
  4824. else
  4825. begin
  4826. tmpreg:=cg.getintregister(list,OS_32);
  4827. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4828. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4829. list.concat(taicpu.op_reg_reg(A_ADD,reg.reglo,tmpreg));
  4830. end;
  4831. tmpreg:=cg.getintregister(list,OS_32);
  4832. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  4833. list.concat(taicpu.op_reg_reg(A_ADC,reg.reghi,tmpreg));
  4834. end;
  4835. OP_SUB:
  4836. begin
  4837. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4838. begin
  4839. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4840. list.concat(taicpu.op_reg_const(A_SUB,reg.reglo,aint(lo(value))))
  4841. end
  4842. else
  4843. begin
  4844. tmpreg:=cg.getintregister(list,OS_32);
  4845. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4846. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4847. list.concat(taicpu.op_reg_reg(A_SUB,reg.reglo,tmpreg));
  4848. end;
  4849. tmpreg:=cg.getintregister(list,OS_32);
  4850. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  4851. list.concat(taicpu.op_reg_reg(A_SBC,reg.reghi,tmpreg));
  4852. end;
  4853. else
  4854. internalerror(2003083101);
  4855. end;
  4856. end;
  4857. procedure create_codegen;
  4858. begin
  4859. if GenerateThumb2Code then
  4860. begin
  4861. cg:=tthumb2cgarm.create;
  4862. cg64:=tthumb2cg64farm.create;
  4863. casmoptimizer:=TCpuThumb2AsmOptimizer;
  4864. end
  4865. else if GenerateThumbCode then
  4866. begin
  4867. cg:=tthumbcgarm.create;
  4868. cg64:=tthumbcg64farm.create;
  4869. // casmoptimizer:=TCpuThumbAsmOptimizer;
  4870. end
  4871. else
  4872. begin
  4873. cg:=tarmcgarm.create;
  4874. cg64:=tarmcg64farm.create;
  4875. casmoptimizer:=TCpuAsmOptimizer;
  4876. end;
  4877. end;
  4878. end.