cgcpu.pas 222 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411241224132414241524162417241824192420242124222423242424252426242724282429243024312432243324342435243624372438243924402441244224432444244524462447244824492450245124522453245424552456245724582459246024612462246324642465246624672468246924702471247224732474247524762477247824792480248124822483248424852486248724882489249024912492249324942495249624972498249925002501250225032504250525062507250825092510251125122513251425152516251725182519252025212522252325242525252625272528252925302531253225332534253525362537253825392540254125422543254425452546254725482549255025512552255325542555255625572558255925602561256225632564256525662567256825692570257125722573257425752576257725782579258025812582258325842585258625872588258925902591259225932594259525962597259825992600260126022603260426052606260726082609261026112612261326142615261626172618261926202621262226232624262526262627262826292630263126322633263426352636263726382639264026412642264326442645264626472648264926502651265226532654265526562657265826592660266126622663266426652666266726682669267026712672267326742675267626772678267926802681268226832684268526862687268826892690269126922693269426952696269726982699270027012702270327042705270627072708270927102711271227132714271527162717271827192720272127222723272427252726272727282729273027312732273327342735273627372738273927402741274227432744274527462747274827492750275127522753275427552756275727582759276027612762276327642765276627672768276927702771277227732774277527762777277827792780278127822783278427852786278727882789279027912792279327942795279627972798279928002801280228032804280528062807280828092810281128122813281428152816281728182819282028212822282328242825282628272828282928302831283228332834283528362837283828392840284128422843284428452846284728482849285028512852285328542855285628572858285928602861286228632864286528662867286828692870287128722873287428752876287728782879288028812882288328842885288628872888288928902891289228932894289528962897289828992900290129022903290429052906290729082909291029112912291329142915291629172918291929202921292229232924292529262927292829292930293129322933293429352936293729382939294029412942294329442945294629472948294929502951295229532954295529562957295829592960296129622963296429652966296729682969297029712972297329742975297629772978297929802981298229832984298529862987298829892990299129922993299429952996299729982999300030013002300330043005300630073008300930103011301230133014301530163017301830193020302130223023302430253026302730283029303030313032303330343035303630373038303930403041304230433044304530463047304830493050305130523053305430553056305730583059306030613062306330643065306630673068306930703071307230733074307530763077307830793080308130823083308430853086308730883089309030913092309330943095309630973098309931003101310231033104310531063107310831093110311131123113311431153116311731183119312031213122312331243125312631273128312931303131313231333134313531363137313831393140314131423143314431453146314731483149315031513152315331543155315631573158315931603161316231633164316531663167316831693170317131723173317431753176317731783179318031813182318331843185318631873188318931903191319231933194319531963197319831993200320132023203320432053206320732083209321032113212321332143215321632173218321932203221322232233224322532263227322832293230323132323233323432353236323732383239324032413242324332443245324632473248324932503251325232533254325532563257325832593260326132623263326432653266326732683269327032713272327332743275327632773278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377737783779378037813782378337843785378637873788378937903791379237933794379537963797379837993800380138023803380438053806380738083809381038113812381338143815381638173818381938203821382238233824382538263827382838293830383138323833383438353836383738383839384038413842384338443845384638473848384938503851385238533854385538563857385838593860386138623863386438653866386738683869387038713872387338743875387638773878387938803881388238833884388538863887388838893890389138923893389438953896389738983899390039013902390339043905390639073908390939103911391239133914391539163917391839193920392139223923392439253926392739283929393039313932393339343935393639373938393939403941394239433944394539463947394839493950395139523953395439553956395739583959396039613962396339643965396639673968396939703971397239733974397539763977397839793980398139823983398439853986398739883989399039913992399339943995399639973998399940004001400240034004400540064007400840094010401140124013401440154016401740184019402040214022402340244025402640274028402940304031403240334034403540364037403840394040404140424043404440454046404740484049405040514052405340544055405640574058405940604061406240634064406540664067406840694070407140724073407440754076407740784079408040814082408340844085408640874088408940904091409240934094409540964097409840994100410141024103410441054106410741084109411041114112411341144115411641174118411941204121412241234124412541264127412841294130413141324133413441354136413741384139414041414142414341444145414641474148414941504151415241534154415541564157415841594160416141624163416441654166416741684169417041714172417341744175417641774178417941804181418241834184418541864187418841894190419141924193419441954196419741984199420042014202420342044205420642074208420942104211421242134214421542164217421842194220422142224223422442254226422742284229423042314232423342344235423642374238423942404241424242434244424542464247424842494250425142524253425442554256425742584259426042614262426342644265426642674268426942704271427242734274427542764277427842794280428142824283428442854286428742884289429042914292429342944295429642974298429943004301430243034304430543064307430843094310431143124313431443154316431743184319432043214322432343244325432643274328432943304331433243334334433543364337433843394340434143424343434443454346434743484349435043514352435343544355435643574358435943604361436243634364436543664367436843694370437143724373437443754376437743784379438043814382438343844385438643874388438943904391439243934394439543964397439843994400440144024403440444054406440744084409441044114412441344144415441644174418441944204421442244234424442544264427442844294430443144324433443444354436443744384439444044414442444344444445444644474448444944504451445244534454445544564457445844594460446144624463446444654466446744684469447044714472447344744475447644774478447944804481448244834484448544864487448844894490449144924493449444954496449744984499450045014502450345044505450645074508450945104511451245134514451545164517451845194520452145224523452445254526452745284529453045314532453345344535453645374538453945404541454245434544454545464547454845494550455145524553455445554556455745584559456045614562456345644565456645674568456945704571457245734574457545764577457845794580458145824583458445854586458745884589459045914592459345944595459645974598459946004601460246034604460546064607460846094610461146124613461446154616461746184619462046214622462346244625462646274628462946304631463246334634463546364637463846394640464146424643464446454646464746484649465046514652465346544655465646574658465946604661466246634664466546664667466846694670467146724673467446754676467746784679468046814682468346844685468646874688468946904691469246934694469546964697469846994700470147024703470447054706470747084709471047114712471347144715471647174718471947204721472247234724472547264727472847294730473147324733473447354736473747384739474047414742474347444745474647474748474947504751475247534754475547564757475847594760476147624763476447654766476747684769477047714772477347744775477647774778477947804781478247834784478547864787478847894790479147924793479447954796479747984799480048014802480348044805480648074808480948104811481248134814481548164817481848194820482148224823482448254826482748284829483048314832483348344835483648374838483948404841484248434844484548464847484848494850485148524853485448554856485748584859486048614862486348644865486648674868486948704871487248734874487548764877487848794880488148824883488448854886488748884889489048914892489348944895489648974898489949004901490249034904490549064907490849094910491149124913491449154916491749184919492049214922492349244925492649274928492949304931493249334934493549364937493849394940494149424943494449454946494749484949495049514952495349544955495649574958495949604961496249634964496549664967496849694970497149724973497449754976497749784979498049814982498349844985498649874988498949904991499249934994499549964997499849995000500150025003500450055006500750085009501050115012501350145015501650175018501950205021502250235024502550265027502850295030503150325033503450355036503750385039504050415042504350445045504650475048504950505051505250535054505550565057505850595060506150625063506450655066506750685069507050715072507350745075507650775078507950805081508250835084508550865087508850895090509150925093509450955096509750985099510051015102510351045105510651075108510951105111511251135114511551165117511851195120512151225123512451255126512751285129513051315132513351345135513651375138513951405141514251435144514551465147514851495150515151525153515451555156515751585159516051615162516351645165516651675168516951705171517251735174517551765177517851795180518151825183518451855186518751885189519051915192519351945195519651975198519952005201520252035204520552065207520852095210521152125213521452155216521752185219522052215222522352245225522652275228522952305231523252335234523552365237523852395240524152425243524452455246524752485249525052515252525352545255525652575258525952605261526252635264526552665267526852695270527152725273527452755276527752785279528052815282528352845285528652875288528952905291529252935294529552965297529852995300530153025303530453055306530753085309531053115312531353145315531653175318531953205321532253235324532553265327532853295330533153325333533453355336533753385339534053415342534353445345534653475348534953505351535253535354535553565357535853595360536153625363536453655366536753685369537053715372537353745375537653775378537953805381538253835384538553865387538853895390539153925393539453955396539753985399540054015402540354045405540654075408540954105411541254135414541554165417541854195420542154225423542454255426542754285429543054315432543354345435543654375438543954405441544254435444544554465447544854495450545154525453545454555456545754585459546054615462546354645465546654675468546954705471547254735474547554765477
  1. {
  2. Copyright (c) 2003 by Florian Klaempfl
  3. Member of the Free Pascal development team
  4. This unit implements the code generator for the ARM
  5. This program is free software; you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation; either version 2 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program; if not, write to the Free Software
  15. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  16. ****************************************************************************
  17. }
  18. unit cgcpu;
  19. {$i fpcdefs.inc}
  20. interface
  21. uses
  22. globtype,symtype,symdef,
  23. cgbase,cgutils,cgobj,
  24. aasmbase,aasmcpu,aasmtai,aasmdata,
  25. parabase,
  26. cpubase,cpuinfo,cg64f32,rgcpu;
  27. type
  28. { tbasecgarm is shared between all arm architectures }
  29. tbasecgarm = class(tcg)
  30. { true, if the next arithmetic operation should modify the flags }
  31. cgsetflags : boolean;
  32. procedure a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);override;
  33. protected
  34. procedure a_load_ref_cgparalocref(list: TAsmList; sourcesize: tcgsize; sizeleft: tcgint; const ref, paralocref: treference; const cgpara: tcgpara; const location: PCGParaLocation); override;
  35. procedure init_mmregister_allocator;
  36. public
  37. procedure a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);override;
  38. procedure a_call_name(list : TAsmList;const s : string; weak: boolean);override;
  39. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  40. { move instructions }
  41. procedure a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);override;
  42. procedure a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);override;
  43. function a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  44. function a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  45. { fpu move instructions }
  46. procedure a_loadfpu_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister); override;
  47. procedure a_loadfpu_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister); override;
  48. procedure a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference); override;
  49. procedure g_check_for_fpu_exception(list : TAsmList; force,clear : boolean); override;
  50. procedure a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);override;
  51. { comparison operations }
  52. procedure a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  53. l : tasmlabel);override;
  54. procedure a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel); override;
  55. procedure a_jmp_name(list : TAsmList;const s : string); override;
  56. procedure a_jmp_always(list : TAsmList;l: tasmlabel); override;
  57. procedure a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel); override;
  58. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  59. procedure g_profilecode(list : TAsmList); override;
  60. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  61. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  62. procedure g_maybe_got_init(list : TAsmList); override;
  63. procedure a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);override;
  64. procedure g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);override;
  65. procedure g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);override;
  66. procedure g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  67. procedure g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  68. procedure g_overflowcheck(list: TAsmList; const l: tlocation; def: tdef); override;
  69. procedure g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);override;
  70. procedure g_save_registers(list : TAsmList);override;
  71. procedure g_restore_registers(list : TAsmList);override;
  72. procedure a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  73. procedure fixref(list : TAsmList;var ref : treference);
  74. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; virtual;
  75. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  76. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  77. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  78. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  79. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  80. procedure a_opmm_reg_reg(list: TAsmList; Op: TOpCG; size : tcgsize;src,dst: tregister;shuffle : pmmshuffle); override;
  81. { Transform unsupported methods into Internal errors }
  82. procedure a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister); override;
  83. { try to generate optimized 32 Bit multiplication, returns true if successful generated }
  84. function try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  85. { clear out potential overflow bits from 8 or 16 bit operations
  86. the upper 24/16 bits of a register after an operation }
  87. procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  88. { mla for thumb requires that none of the registers is equal to r13/r15, this method ensures this }
  89. procedure safe_mla(list: TAsmList;op1,op2,op3,op4 : TRegister);
  90. procedure g_maybe_tls_init(list : TAsmList); override;
  91. end;
  92. { tcgarm is shared between normal arm and thumb-2 }
  93. tcgarm = class(tbasecgarm)
  94. procedure a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister); override;
  95. procedure a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference); override;
  96. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  97. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  98. size: tcgsize; a: tcgint; src, dst: tregister); override;
  99. procedure a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  100. size: tcgsize; src1, src2, dst: tregister); override;
  101. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  102. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  103. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  104. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  105. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  106. {Multiply two 32-bit registers into lo and hi 32-bit registers}
  107. procedure a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister); override;
  108. end;
  109. { normal arm cg }
  110. tarmcgarm = class(tcgarm)
  111. procedure init_register_allocators;override;
  112. procedure done_register_allocators;override;
  113. end;
  114. { 64 bit cg for all arm flavours }
  115. tbasecg64farm = class(tcg64f32)
  116. end;
  117. { tcg64farm is shared between normal arm and thumb-2 }
  118. tcg64farm = class(tbasecg64farm)
  119. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  120. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  121. procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;
  122. procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
  123. procedure a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  124. procedure a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  125. procedure a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);override;
  126. procedure a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);override;
  127. end;
  128. tarmcg64farm = class(tcg64farm)
  129. end;
  130. tthumbcgarm = class(tbasecgarm)
  131. procedure init_register_allocators;override;
  132. procedure done_register_allocators;override;
  133. procedure g_proc_entry(list: TAsmList; localsize: longint; nostackframe: boolean);override;
  134. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  135. procedure a_op_reg_reg(list: TAsmList; Op: TOpCG; size: TCGSize; src,dst: TRegister);override;
  136. procedure a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);override;
  137. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister); override;
  138. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  139. procedure a_load_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const Ref: treference; reg: tregister);override;
  140. procedure a_load_const_reg(list: TAsmList; size: tcgsize; a: tcgint; reg: tregister);override;
  141. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  142. function handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference; override;
  143. end;
  144. tthumbcg64farm = class(tbasecg64farm)
  145. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  146. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  147. end;
  148. tthumb2cgarm = class(tcgarm)
  149. procedure init_register_allocators;override;
  150. procedure done_register_allocators;override;
  151. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  152. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  153. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  154. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  155. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  156. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  157. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  158. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  159. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  160. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; override;
  161. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  162. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  163. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  164. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  165. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  166. end;
  167. tthumb2cg64farm = class(tcg64farm)
  168. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  169. end;
  170. const
  171. OpCmp2AsmCond : Array[topcmp] of TAsmCond = (C_NONE,C_EQ,C_GT,
  172. C_LT,C_GE,C_LE,C_NE,C_LS,C_CC,C_CS,C_HI);
  173. winstackpagesize = 4096;
  174. function get_fpu_postfix(def : tdef) : toppostfix;
  175. procedure create_codegen;
  176. implementation
  177. uses
  178. globals,verbose,systems,cutils,
  179. aopt,aoptcpu,
  180. fmodule,
  181. symconst,symsym,symtable,
  182. tgobj,
  183. procinfo,cpupi,
  184. paramgr;
  185. { Range check must be disabled explicitly as conversions between signed and unsigned
  186. 32-bit values are done without explicit typecasts }
  187. {$R-}
  188. function get_fpu_postfix(def : tdef) : toppostfix;
  189. begin
  190. if def.typ=floatdef then
  191. begin
  192. case tfloatdef(def).floattype of
  193. s32real:
  194. result:=PF_S;
  195. s64real:
  196. result:=PF_D;
  197. s80real:
  198. result:=PF_E;
  199. else
  200. internalerror(200401272);
  201. end;
  202. end
  203. else
  204. internalerror(200401271);
  205. end;
  206. procedure tarmcgarm.init_register_allocators;
  207. begin
  208. inherited init_register_allocators;
  209. { currently, we always save R14, so we can use it }
  210. if (target_info.system<>system_arm_ios) then
  211. begin
  212. if assigned(current_procinfo) and (current_procinfo.framepointer<>NR_R11) then
  213. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  214. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  215. RS_R9,RS_R10,RS_R11,RS_R14],first_int_imreg,[])
  216. else
  217. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  218. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  219. RS_R9,RS_R10,RS_R14],first_int_imreg,[])
  220. end
  221. else
  222. { r7 is not available on Darwin, it's used as frame pointer (always,
  223. for backtrace support -- also in gcc/clang -> R11 can be used).
  224. r9 is volatile }
  225. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  226. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R9,RS_R12,RS_R4,RS_R5,RS_R6,RS_R8,
  227. RS_R10,RS_R11,RS_R14],first_int_imreg,[]);
  228. if FPUARM_HAS_FPA in fpu_capabilities[current_settings.fputype] then
  229. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  230. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  231. init_mmregister_allocator;
  232. end;
  233. procedure tarmcgarm.done_register_allocators;
  234. begin
  235. rg[R_INTREGISTER].free;
  236. rg[R_FPUREGISTER].free;
  237. rg[R_MMREGISTER].free;
  238. inherited done_register_allocators;
  239. end;
  240. procedure tcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  241. var
  242. imm_shift : byte;
  243. l : tasmlabel;
  244. hr : treference;
  245. imm1, imm2: DWord;
  246. begin
  247. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  248. internalerror(2002090907);
  249. if is_shifter_const(a,imm_shift) then
  250. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  251. else if is_shifter_const(not(a),imm_shift) then
  252. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  253. { loading of constants with mov and orr }
  254. else if (split_into_shifter_const(a,imm1, imm2)) then
  255. begin
  256. list.concat(taicpu.op_reg_const(A_MOV,reg, imm1));
  257. list.concat(taicpu.op_reg_reg_const(A_ORR,reg,reg, imm2));
  258. end
  259. { loading of constants with mvn and bic }
  260. else if (split_into_shifter_const(not(a), imm1, imm2)) then
  261. begin
  262. list.concat(taicpu.op_reg_const(A_MVN,reg, imm1));
  263. list.concat(taicpu.op_reg_reg_const(A_BIC,reg,reg, imm2));
  264. end
  265. else
  266. begin
  267. reference_reset(hr,4,[]);
  268. current_asmdata.getjumplabel(l);
  269. cg.a_label(current_procinfo.aktlocaldata,l);
  270. hr.symboldata:=current_procinfo.aktlocaldata.last;
  271. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  272. hr.symbol:=l;
  273. hr.base:=NR_PC;
  274. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  275. end;
  276. end;
  277. procedure tcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  278. var
  279. oppostfix:toppostfix;
  280. usedtmpref: treference;
  281. tmpreg,tmpreg2 : tregister;
  282. so : tshifterop;
  283. dir : integer;
  284. begin
  285. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  286. FromSize := ToSize;
  287. case FromSize of
  288. { signed integer registers }
  289. OS_8:
  290. oppostfix:=PF_B;
  291. OS_S8:
  292. oppostfix:=PF_SB;
  293. OS_16:
  294. oppostfix:=PF_H;
  295. OS_S16:
  296. oppostfix:=PF_SH;
  297. OS_32,
  298. OS_S32:
  299. oppostfix:=PF_None;
  300. else
  301. InternalError(200308297);
  302. end;
  303. if (fromsize=OS_S8) and
  304. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  305. oppostfix:=PF_B;
  306. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize])) or
  307. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  308. (oppostfix in [PF_SH,PF_H])) then
  309. begin
  310. if target_info.endian=endian_big then
  311. dir:=-1
  312. else
  313. dir:=1;
  314. case FromSize of
  315. OS_16,OS_S16:
  316. begin
  317. { only complicated references need an extra loadaddr }
  318. if assigned(ref.symbol) or
  319. (ref.index<>NR_NO) or
  320. (ref.offset<-4095) or
  321. (ref.offset>4094) or
  322. { sometimes the compiler reused registers }
  323. (reg=ref.index) or
  324. (reg=ref.base) then
  325. begin
  326. tmpreg2:=getintregister(list,OS_INT);
  327. a_loadaddr_ref_reg(list,ref,tmpreg2);
  328. reference_reset_base(usedtmpref,tmpreg2,0,ref.temppos,ref.alignment,ref.volatility);
  329. end
  330. else
  331. usedtmpref:=ref;
  332. if target_info.endian=endian_big then
  333. inc(usedtmpref.offset,1);
  334. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  335. tmpreg:=getintregister(list,OS_INT);
  336. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  337. inc(usedtmpref.offset,dir);
  338. if FromSize=OS_16 then
  339. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  340. else
  341. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  342. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  343. end;
  344. OS_32,OS_S32:
  345. begin
  346. tmpreg:=getintregister(list,OS_INT);
  347. { only complicated references need an extra loadaddr }
  348. if assigned(ref.symbol) or
  349. (ref.index<>NR_NO) or
  350. (ref.offset<-4095) or
  351. (ref.offset>4092) or
  352. { sometimes the compiler reused registers }
  353. (reg=ref.index) or
  354. (reg=ref.base) then
  355. begin
  356. tmpreg2:=getintregister(list,OS_INT);
  357. a_loadaddr_ref_reg(list,ref,tmpreg2);
  358. reference_reset_base(usedtmpref,tmpreg2,0,ref.temppos,ref.alignment,ref.volatility);
  359. end
  360. else
  361. usedtmpref:=ref;
  362. shifterop_reset(so);so.shiftmode:=SM_LSL;
  363. if ref.alignment=2 then
  364. begin
  365. if target_info.endian=endian_big then
  366. inc(usedtmpref.offset,2);
  367. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  368. inc(usedtmpref.offset,dir*2);
  369. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  370. so.shiftimm:=16;
  371. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  372. end
  373. else
  374. begin
  375. tmpreg2:=getintregister(list,OS_INT);
  376. if target_info.endian=endian_big then
  377. inc(usedtmpref.offset,3);
  378. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  379. inc(usedtmpref.offset,dir);
  380. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  381. inc(usedtmpref.offset,dir);
  382. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg2);
  383. so.shiftimm:=8;
  384. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  385. inc(usedtmpref.offset,dir);
  386. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  387. so.shiftimm:=16;
  388. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg2,so));
  389. so.shiftimm:=24;
  390. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  391. end;
  392. end
  393. else
  394. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  395. end;
  396. end
  397. else
  398. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  399. if (fromsize=OS_S8) and
  400. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  401. a_load_reg_reg(list,OS_S8,OS_32,reg,reg)
  402. else if (fromsize=OS_S8) and (tosize = OS_16) then
  403. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  404. end;
  405. procedure tcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  406. var
  407. hsym : tsym;
  408. href : treference;
  409. paraloc : Pcgparalocation;
  410. shift : byte;
  411. begin
  412. { calculate the parameter info for the procdef }
  413. procdef.init_paraloc_info(callerside);
  414. hsym:=tsym(procdef.parast.Find('self'));
  415. if not(assigned(hsym) and
  416. (hsym.typ=paravarsym)) then
  417. internalerror(2003052503);
  418. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  419. while paraloc<>nil do
  420. with paraloc^ do
  421. begin
  422. case loc of
  423. LOC_REGISTER:
  424. begin
  425. if is_shifter_const(ioffset,shift) then
  426. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  427. else
  428. begin
  429. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  430. a_op_reg_reg(list,OP_SUB,size,NR_R12,register);
  431. end;
  432. end;
  433. LOC_REFERENCE:
  434. begin
  435. { offset in the wrapper needs to be adjusted for the stored
  436. return address }
  437. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),ctempposinvalid,sizeof(pint),[]);
  438. if is_shifter_const(ioffset,shift) then
  439. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  440. else
  441. begin
  442. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  443. a_op_reg_ref(list,OP_SUB,size,NR_R12,href);
  444. end;
  445. end
  446. else
  447. internalerror(2003091803);
  448. end;
  449. paraloc:=next;
  450. end;
  451. end;
  452. procedure tbasecgarm.a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);
  453. var
  454. ref: treference;
  455. begin
  456. paraloc.check_simple_location;
  457. paramanager.allocparaloc(list,paraloc.location);
  458. case paraloc.location^.loc of
  459. LOC_REGISTER,LOC_CREGISTER:
  460. a_load_const_reg(list,size,a,paraloc.location^.register);
  461. LOC_REFERENCE:
  462. begin
  463. reference_reset(ref,paraloc.alignment,[]);
  464. ref.base:=paraloc.location^.reference.index;
  465. ref.offset:=paraloc.location^.reference.offset;
  466. a_load_const_ref(list,size,a,ref);
  467. end;
  468. else
  469. internalerror(2002081101);
  470. end;
  471. end;
  472. procedure tbasecgarm.a_load_ref_cgparalocref(list: TAsmList; sourcesize: tcgsize; sizeleft: tcgint; const ref, paralocref: treference; const cgpara: tcgpara; const location: PCGParaLocation);
  473. begin
  474. { doubles in softemu mode have a strange order of registers and references }
  475. if (cgpara.size=OS_F64) and
  476. (location^.size=OS_32) then
  477. begin
  478. g_concatcopy(list,ref,paralocref,4)
  479. end
  480. else
  481. inherited;
  482. end;
  483. procedure tbasecgarm.init_mmregister_allocator;
  484. begin
  485. { The register allocator currently cannot deal with multiple
  486. non-overlapping subregs per register, so we can only use
  487. half the single precision registers for now (as sub registers of the
  488. double precision ones). }
  489. if (FPUARM_HAS_32REGS in fpu_capabilities[current_settings.fputype]) and
  490. (FPUARM_HAS_VFP_DOUBLE in fpu_capabilities[current_settings.fputype]) then
  491. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  492. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  493. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  494. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  495. ],first_mm_imreg,[])
  496. else if (FPUARM_HAS_32REGS in fpu_capabilities[current_settings.fputype]) then
  497. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFS,
  498. [RS_S0,RS_S1,RS_S2,RS_S3,RS_S4,RS_S5,RS_S6,RS_S7,
  499. RS_S16,RS_S17,RS_S18,RS_S19,RS_S20,RS_S21,RS_S22,RS_S23,RS_S24,RS_S25,RS_S26,RS_S27,RS_S28,RS_S29,RS_S30,RS_S31,
  500. RS_S8,RS_S9,RS_S10,RS_S11,RS_S12,RS_S13,RS_S14,RS_S15
  501. ],first_mm_imreg,[])
  502. else if FPUARM_HAS_VFP_EXTENSION in fpu_capabilities[current_settings.fputype] then
  503. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  504. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  505. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  506. ],first_mm_imreg,[]);
  507. end;
  508. procedure tbasecgarm.a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);
  509. var
  510. ref: treference;
  511. tmpreg: tregister;
  512. begin
  513. paraloc.check_simple_location;
  514. paramanager.allocparaloc(list,paraloc.location);
  515. case paraloc.location^.loc of
  516. LOC_REGISTER,LOC_CREGISTER:
  517. a_loadaddr_ref_reg(list,r,paraloc.location^.register);
  518. LOC_REFERENCE:
  519. begin
  520. reference_reset(ref,paraloc.alignment,[]);
  521. ref.base := paraloc.location^.reference.index;
  522. ref.offset := paraloc.location^.reference.offset;
  523. tmpreg := getintregister(list,OS_ADDR);
  524. a_loadaddr_ref_reg(list,r,tmpreg);
  525. a_load_reg_ref(list,OS_ADDR,OS_ADDR,tmpreg,ref);
  526. end;
  527. else
  528. internalerror(2002080701);
  529. end;
  530. end;
  531. procedure tbasecgarm.a_call_name(list : TAsmList;const s : string; weak: boolean);
  532. var
  533. branchopcode: tasmop;
  534. r : treference;
  535. sym : TAsmSymbol;
  536. begin
  537. { use always BL as newer binutils do not translate blx apparently
  538. generating BL is also what clang and gcc do by default }
  539. branchopcode:=A_BL;
  540. if not(weak) then
  541. sym:=current_asmdata.RefAsmSymbol(s,AT_FUNCTION)
  542. else
  543. sym:=current_asmdata.WeakRefAsmSymbol(s,AT_FUNCTION);
  544. reference_reset_symbol(r,sym,0,sizeof(pint),[]);
  545. if (tf_pic_uses_got in target_info.flags) and
  546. (cs_create_pic in current_settings.moduleswitches) then
  547. begin
  548. r.refaddr:=addr_pic
  549. end
  550. else
  551. r.refaddr:=addr_full;
  552. list.concat(taicpu.op_ref(branchopcode,r));
  553. {
  554. the compiler does not properly set this flag anymore in pass 1, and
  555. for now we only need it after pass 2 (I hope) (JM)
  556. if not(pi_do_call in current_procinfo.flags) then
  557. internalerror(2003060703);
  558. }
  559. include(current_procinfo.flags,pi_do_call);
  560. end;
  561. procedure tbasecgarm.a_call_reg(list : TAsmList;reg: tregister);
  562. begin
  563. { check not really correct: should only be used for non-Thumb cpus }
  564. if not(CPUARM_HAS_BLX in cpu_capabilities[current_settings.cputype]) then
  565. begin
  566. list.concat(taicpu.op_reg_reg(A_MOV,NR_R14,NR_PC));
  567. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,reg));
  568. end
  569. else
  570. list.concat(taicpu.op_reg(A_BLX, reg));
  571. {
  572. the compiler does not properly set this flag anymore in pass 1, and
  573. for now we only need it after pass 2 (I hope) (JM)
  574. if not(pi_do_call in current_procinfo.flags) then
  575. internalerror(2003060703);
  576. }
  577. include(current_procinfo.flags,pi_do_call);
  578. end;
  579. procedure tcgarm.a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister);
  580. begin
  581. a_op_const_reg_reg(list,op,size,a,reg,reg);
  582. end;
  583. procedure tcgarm.a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference);
  584. var
  585. tmpreg,tmpresreg : tregister;
  586. tmpref : treference;
  587. begin
  588. tmpreg:=getintregister(list,size);
  589. tmpresreg:=getintregister(list,size);
  590. tmpref:=a_internal_load_ref_reg(list,size,size,ref,tmpreg);
  591. a_op_const_reg_reg(list,op,size,a,tmpreg,tmpresreg);
  592. a_load_reg_ref(list,size,size,tmpresreg,tmpref);
  593. end;
  594. procedure tcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  595. var
  596. so : tshifterop;
  597. begin
  598. if op = OP_NEG then
  599. begin
  600. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,src,0));
  601. maybeadjustresult(list,OP_NEG,size,dst);
  602. end
  603. else if op = OP_NOT then
  604. begin
  605. if size in [OS_8, OS_16, OS_S8, OS_S16] then
  606. begin
  607. shifterop_reset(so);
  608. so.shiftmode:=SM_LSL;
  609. if size in [OS_8, OS_S8] then
  610. so.shiftimm:=24
  611. else
  612. so.shiftimm:=16;
  613. list.concat(taicpu.op_reg_reg_shifterop(A_MVN,dst,src,so));
  614. {Using a shift here allows this to be folded into another instruction}
  615. if size in [OS_S8, OS_S16] then
  616. so.shiftmode:=SM_ASR
  617. else
  618. so.shiftmode:=SM_LSR;
  619. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  620. end
  621. else
  622. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  623. end
  624. else
  625. a_op_reg_reg_reg(list,op,size,src,dst,dst);
  626. end;
  627. const
  628. op_reg_reg_opcg2asmop: array[TOpCG] of tasmop =
  629. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  630. A_NONE,A_NONE,A_NONE,A_SUB,A_EOR,A_NONE,A_NONE);
  631. op_reg_opcg2asmop: array[TOpCG] of tasmop =
  632. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  633. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  634. op_reg_postfix_thumb: array[TOpCG] of TOpPostfix =
  635. (PF_None,PF_None,PF_None,PF_S,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_S,
  636. PF_None,PF_S,PF_S,PF_None,PF_S,PF_None,PF_S);
  637. procedure tcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  638. size: tcgsize; a: tcgint; src, dst: tregister);
  639. var
  640. ovloc : tlocation;
  641. begin
  642. a_op_const_reg_reg_checkoverflow(list,op,size,a,src,dst,false,ovloc);
  643. end;
  644. procedure tcgarm.a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  645. size: tcgsize; src1, src2, dst: tregister);
  646. var
  647. ovloc : tlocation;
  648. begin
  649. a_op_reg_reg_reg_checkoverflow(list,op,size,src1,src2,dst,false,ovloc);
  650. end;
  651. function opshift2shiftmode(op: TOpCg): tshiftmode;
  652. begin
  653. case op of
  654. OP_SHL: Result:=SM_LSL;
  655. OP_SHR: Result:=SM_LSR;
  656. OP_ROR: Result:=SM_ROR;
  657. OP_ROL: Result:=SM_ROR;
  658. OP_SAR: Result:=SM_ASR;
  659. else internalerror(2012070501);
  660. end
  661. end;
  662. function tbasecgarm.try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  663. var
  664. multiplier : dword;
  665. power : longint;
  666. shifterop : tshifterop;
  667. bitsset : byte;
  668. negative : boolean;
  669. first : boolean;
  670. b,
  671. cycles : byte;
  672. maxeffort : byte;
  673. begin
  674. result:=true;
  675. cycles:=0;
  676. negative:=a<0;
  677. shifterop.rs:=NR_NO;
  678. shifterop.shiftmode:=SM_LSL;
  679. if negative then
  680. inc(cycles);
  681. multiplier:=dword(abs(a));
  682. bitsset:=popcnt(multiplier and $fffffffe);
  683. { heuristics to estimate how much instructions are reasonable to replace the mul,
  684. this is currently based on XScale timings }
  685. { in the simplest case, we need a mov to load the constant and a mul to carry out the
  686. actual multiplication, this requires min. 1+4 cycles
  687. because the first shift imm. might cause a stall and because we need more instructions
  688. when replacing the mul we generate max. 3 instructions to replace this mul }
  689. maxeffort:=3;
  690. { if the constant is not a shifter op, we need either some mov/mvn/bic/or sequence or
  691. a ldr, so generating one more operation to replace this is beneficial }
  692. if not(is_shifter_const(dword(a),b)) and not(is_shifter_const(not(dword(a)),b)) then
  693. inc(maxeffort);
  694. { if the upper 5 bits are all set or clear, mul is one cycle faster }
  695. if ((dword(a) and $f8000000)=0) or ((dword(a) and $f8000000)=$f8000000) then
  696. dec(maxeffort);
  697. { if the upper 17 bits are all set or clear, mul is another cycle faster }
  698. if ((dword(a) and $ffff8000)=0) or ((dword(a) and $ffff8000)=$ffff8000) then
  699. dec(maxeffort);
  700. { most simple cases }
  701. if a=1 then
  702. a_load_reg_reg(list,OS_32,OS_32,src,dst)
  703. else if a=0 then
  704. a_load_const_reg(list,OS_32,0,dst)
  705. else if a=-1 then
  706. a_op_reg_reg(list,OP_NEG,OS_32,src,dst)
  707. { add up ?
  708. basically, one add is needed for each bit being set in the constant factor
  709. however, the least significant bit is for free, it can be hidden in the initial
  710. instruction
  711. }
  712. else if (bitsset+cycles<=maxeffort) and
  713. (bitsset<=popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)) then
  714. begin
  715. first:=true;
  716. while multiplier<>0 do
  717. begin
  718. shifterop.shiftimm:=BsrDWord(multiplier);
  719. if odd(multiplier) then
  720. begin
  721. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,shifterop));
  722. dec(multiplier);
  723. end
  724. else
  725. if first then
  726. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  727. else
  728. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,src,shifterop));
  729. first:=false;
  730. dec(multiplier,1 shl shifterop.shiftimm);
  731. end;
  732. if negative then
  733. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  734. end
  735. { subtract from the next greater power of two? }
  736. else if popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)+cycles+1<=maxeffort then
  737. begin
  738. first:=true;
  739. while multiplier<>0 do
  740. begin
  741. if first then
  742. begin
  743. multiplier:=(1 shl power)-multiplier;
  744. shifterop.shiftimm:=power;
  745. end
  746. else
  747. shifterop.shiftimm:=BsrDWord(multiplier);
  748. if odd(multiplier) then
  749. begin
  750. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,shifterop));
  751. dec(multiplier);
  752. end
  753. else
  754. if first then
  755. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  756. else
  757. begin
  758. list.concat(taicpu.op_reg_reg_reg_shifterop(A_SUB,dst,dst,src,shifterop));
  759. dec(multiplier,1 shl shifterop.shiftimm);
  760. end;
  761. first:=false;
  762. end;
  763. if negative then
  764. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  765. end
  766. else
  767. result:=false;
  768. end;
  769. procedure tcgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  770. var
  771. shift, lsb, width : byte;
  772. tmpreg : tregister;
  773. so : tshifterop;
  774. l1 : longint;
  775. imm1, imm2: DWord;
  776. begin
  777. optimize_op_const(size, op, a);
  778. case op of
  779. OP_NONE:
  780. begin
  781. if src <> dst then
  782. a_load_reg_reg(list, size, size, src, dst);
  783. exit;
  784. end;
  785. OP_MOVE:
  786. begin
  787. a_load_const_reg(list, size, a, dst);
  788. exit;
  789. end;
  790. else
  791. ;
  792. end;
  793. ovloc.loc:=LOC_VOID;
  794. if (a<>-2147483648) and not setflags and is_shifter_const(-a,shift) then
  795. case op of
  796. OP_ADD:
  797. begin
  798. op:=OP_SUB;
  799. a:=aint(dword(-a));
  800. end;
  801. OP_SUB:
  802. begin
  803. op:=OP_ADD;
  804. a:=aint(dword(-a));
  805. end
  806. else
  807. ;
  808. end;
  809. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  810. case op of
  811. OP_NEG,OP_NOT:
  812. internalerror(200308281);
  813. OP_SHL,
  814. OP_SHR,
  815. OP_ROL,
  816. OP_ROR,
  817. OP_SAR:
  818. begin
  819. if a>32 then
  820. internalerror(200308294);
  821. shifterop_reset(so);
  822. so.shiftmode:=opshift2shiftmode(op);
  823. if op = OP_ROL then
  824. so.shiftimm:=32-a
  825. else
  826. so.shiftimm:=a;
  827. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  828. end;
  829. else
  830. {if (op in [OP_SUB, OP_ADD]) and
  831. ((a < 0) or
  832. (a > 4095)) then
  833. begin
  834. tmpreg:=getintregister(list,size);
  835. list.concat(taicpu.op_reg_const(A_MOVT, tmpreg, (a shr 16) and $FFFF));
  836. list.concat(taicpu.op_reg_const(A_MOV, tmpreg, a and $FFFF));
  837. list.concat(setoppostfix(taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))
  838. ));
  839. end
  840. else}
  841. begin
  842. if cgsetflags or setflags then
  843. a_reg_alloc(list,NR_DEFAULTFLAGS);
  844. list.concat(setoppostfix(
  845. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  846. end;
  847. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  848. begin
  849. ovloc.loc:=LOC_FLAGS;
  850. case op of
  851. OP_ADD:
  852. ovloc.resflags:=F_CS;
  853. OP_SUB:
  854. ovloc.resflags:=F_CC;
  855. else
  856. internalerror(2019050922);
  857. end;
  858. end;
  859. end
  860. else
  861. begin
  862. { there could be added some more sophisticated optimizations }
  863. if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  864. a_op_reg_reg(list,OP_NEG,size,src,dst)
  865. { we do this here instead in the peephole optimizer because
  866. it saves us a register }
  867. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  868. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  869. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  870. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  871. begin
  872. if l1>32 then{roozbeh does this ever happen?}
  873. internalerror(200308296);
  874. shifterop_reset(so);
  875. so.shiftmode:=SM_LSL;
  876. so.shiftimm:=l1;
  877. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  878. end
  879. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  880. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  881. begin
  882. if l1>32 then{does this ever happen?}
  883. internalerror(201205181);
  884. shifterop_reset(so);
  885. so.shiftmode:=SM_LSL;
  886. so.shiftimm:=l1;
  887. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  888. end
  889. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  890. begin
  891. { nothing to do on success }
  892. end
  893. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  894. broader range of shifterconstants.}
  895. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  896. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  897. { Doing two shifts instead of two bics might allow the peephole optimizer to fold the second shift
  898. into the following instruction}
  899. else if (op = OP_AND) and
  900. is_continuous_mask(aword(a), lsb, width) and
  901. ((lsb = 0) or ((lsb + width) = 32)) then
  902. begin
  903. shifterop_reset(so);
  904. if (width = 16) and
  905. (lsb = 0) and
  906. (current_settings.cputype >= cpu_armv6) then
  907. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  908. else if (width = 8) and
  909. (lsb = 0) and
  910. (current_settings.cputype >= cpu_armv6) then
  911. list.concat(taicpu.op_reg_reg(A_UXTB,dst,src))
  912. else if lsb = 0 then
  913. begin
  914. so.shiftmode:=SM_LSL;
  915. so.shiftimm:=32-width;
  916. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  917. so.shiftmode:=SM_LSR;
  918. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  919. end
  920. else
  921. begin
  922. so.shiftmode:=SM_LSR;
  923. so.shiftimm:=lsb;
  924. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  925. so.shiftmode:=SM_LSL;
  926. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  927. end;
  928. end
  929. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  930. begin
  931. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,imm1));
  932. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  933. end
  934. else if (op in [OP_ADD, OP_SUB, OP_OR, OP_XOR]) and
  935. not(cgsetflags or setflags) and
  936. split_into_shifter_const(a, imm1, imm2) then
  937. begin
  938. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,imm1));
  939. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  940. end
  941. else
  942. begin
  943. tmpreg:=getintregister(list,size);
  944. a_load_const_reg(list,size,a,tmpreg);
  945. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  946. end;
  947. end;
  948. maybeadjustresult(list,op,size,dst);
  949. end;
  950. procedure tcgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  951. var
  952. so : tshifterop;
  953. tmpreg,overflowreg : tregister;
  954. asmop : tasmop;
  955. begin
  956. ovloc.loc:=LOC_VOID;
  957. case op of
  958. OP_NEG,OP_NOT,
  959. OP_DIV,OP_IDIV:
  960. internalerror(200308283);
  961. OP_SHL,
  962. OP_SHR,
  963. OP_SAR,
  964. OP_ROR:
  965. begin
  966. if (op = OP_ROR) and not(size in [OS_32,OS_S32]) then
  967. internalerror(2008072801);
  968. shifterop_reset(so);
  969. so.rs:=src1;
  970. so.shiftmode:=opshift2shiftmode(op);
  971. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  972. end;
  973. OP_ROL:
  974. begin
  975. if not(size in [OS_32,OS_S32]) then
  976. internalerror(2008072804);
  977. { simulate ROL by ror'ing 32-value }
  978. tmpreg:=getintregister(list,OS_32);
  979. list.concat(taicpu.op_reg_reg_const(A_RSB,tmpreg,src1, 32));
  980. shifterop_reset(so);
  981. so.rs:=tmpreg;
  982. so.shiftmode:=SM_ROR;
  983. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  984. end;
  985. OP_IMUL,
  986. OP_MUL:
  987. begin
  988. if (cgsetflags or setflags) and
  989. (CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype]) then
  990. begin
  991. overflowreg:=getintregister(list,size);
  992. if op=OP_IMUL then
  993. asmop:=A_SMULL
  994. else
  995. asmop:=A_UMULL;
  996. { the arm doesn't allow that rd and rm are the same }
  997. if dst=src2 then
  998. begin
  999. if dst<>src1 then
  1000. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  1001. else
  1002. begin
  1003. tmpreg:=getintregister(list,size);
  1004. a_load_reg_reg(list,size,size,src2,dst);
  1005. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  1006. end;
  1007. end
  1008. else
  1009. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  1010. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1011. if op=OP_IMUL then
  1012. begin
  1013. shifterop_reset(so);
  1014. so.shiftmode:=SM_ASR;
  1015. so.shiftimm:=31;
  1016. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  1017. end
  1018. else
  1019. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  1020. ovloc.loc:=LOC_FLAGS;
  1021. ovloc.resflags:=F_NE;
  1022. end
  1023. else
  1024. begin
  1025. { the arm doesn't allow that rd and rm are the same }
  1026. if dst=src2 then
  1027. begin
  1028. if dst<>src1 then
  1029. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  1030. else
  1031. begin
  1032. tmpreg:=getintregister(list,size);
  1033. a_load_reg_reg(list,size,size,src2,dst);
  1034. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  1035. end;
  1036. end
  1037. else
  1038. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  1039. end;
  1040. end;
  1041. else
  1042. begin
  1043. if cgsetflags or setflags then
  1044. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1045. list.concat(setoppostfix(
  1046. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  1047. end;
  1048. end;
  1049. maybeadjustresult(list,op,size,dst);
  1050. end;
  1051. procedure tcgarm.a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister);
  1052. var
  1053. asmop: tasmop;
  1054. begin
  1055. if CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype] then
  1056. begin
  1057. list.concat(tai_comment.create(strpnew('tcgarm.a_mul_reg_reg_pair called')));
  1058. case size of
  1059. OS_32: asmop:=A_UMULL;
  1060. OS_S32: asmop:=A_SMULL;
  1061. else
  1062. InternalError(2014060802);
  1063. end;
  1064. { The caller might omit dstlo or dsthi, when he is not interested in it, we still
  1065. need valid registers everywhere. In case of dsthi = NR_NO we could fall back to
  1066. 32x32=32 bit multiplication}
  1067. if (dstlo = NR_NO) then
  1068. dstlo:=getintregister(list,size);
  1069. if (dsthi = NR_NO) then
  1070. dsthi:=getintregister(list,size);
  1071. list.concat(taicpu.op_reg_reg_reg_reg(asmop, dstlo, dsthi, src1,src2));
  1072. end
  1073. else if dsthi=NR_NO then
  1074. begin
  1075. if (dstlo = NR_NO) then
  1076. dstlo:=getintregister(list,size);
  1077. list.concat(taicpu.op_reg_reg_reg(A_MUL, dstlo, src1,src2));
  1078. end
  1079. else
  1080. begin
  1081. internalerror(2015083022);
  1082. end;
  1083. end;
  1084. function tbasecgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  1085. var
  1086. tmpreg1,tmpreg2 : tregister;
  1087. begin
  1088. tmpreg1:=NR_NO;
  1089. { Be sure to have a base register }
  1090. if (ref.base=NR_NO) then
  1091. begin
  1092. if ref.shiftmode<>SM_None then
  1093. internalerror(2014020707);
  1094. ref.base:=ref.index;
  1095. ref.index:=NR_NO;
  1096. end;
  1097. { absolute symbols can't be handled directly, we've to store the symbol reference
  1098. in the text segment and access it pc relative
  1099. For now, we assume that references where base or index equals to PC are already
  1100. relative, all other references are assumed to be absolute and thus they need
  1101. to be handled extra.
  1102. A proper solution would be to change refoptions to a set and store the information
  1103. if the symbol is absolute or relative there.
  1104. }
  1105. if (assigned(ref.symbol) and
  1106. not(is_pc(ref.base)) and
  1107. not(is_pc(ref.index))
  1108. ) or
  1109. { [#xxx] isn't a valid address operand }
  1110. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  1111. (ref.offset<-4095) or
  1112. (ref.offset>4095) or
  1113. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  1114. ((ref.offset<-255) or
  1115. (ref.offset>255)
  1116. )
  1117. ) or
  1118. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1119. ((ref.offset<-1020) or
  1120. (ref.offset>1020) or
  1121. ((abs(ref.offset) mod 4)<>0)
  1122. )
  1123. ) or
  1124. ((GenerateThumbCode) and
  1125. (((oppostfix in [PF_SB,PF_SH]) and (ref.offset<>0)) or
  1126. ((oppostfix=PF_None) and ((ref.offset<0) or ((ref.base<>NR_STACK_POINTER_REG) and (ref.offset>124)) or
  1127. ((ref.base=NR_STACK_POINTER_REG) and (ref.offset>1020)) or ((ref.offset mod 4)<>0))) or
  1128. ((oppostfix=PF_H) and ((ref.offset<0) or (ref.offset>62) or ((ref.offset mod 2)<>0) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0)))) or
  1129. ((oppostfix=PF_B) and ((ref.offset<0) or (ref.offset>31) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0))))
  1130. )
  1131. ) then
  1132. begin
  1133. fixref(list,ref);
  1134. end;
  1135. if GenerateThumbCode then
  1136. begin
  1137. { certain thumb load require base and index }
  1138. if (oppostfix in [PF_SB,PF_SH]) and
  1139. (ref.base<>NR_NO) and (ref.index=NR_NO) then
  1140. begin
  1141. tmpreg1:=getintregister(list,OS_ADDR);
  1142. a_load_const_reg(list,OS_ADDR,0,tmpreg1);
  1143. ref.index:=tmpreg1;
  1144. end;
  1145. { "hi" registers cannot be used as base or index }
  1146. if (getsupreg(ref.base) in [RS_R8..RS_R12,RS_R14]) or
  1147. ((ref.base=NR_R13) and (ref.index<>NR_NO)) then
  1148. begin
  1149. tmpreg1:=getintregister(list,OS_ADDR);
  1150. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.base,tmpreg1);
  1151. ref.base:=tmpreg1;
  1152. end;
  1153. if getsupreg(ref.index) in [RS_R8..RS_R14] then
  1154. begin
  1155. tmpreg1:=getintregister(list,OS_ADDR);
  1156. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.index,tmpreg1);
  1157. ref.index:=tmpreg1;
  1158. end;
  1159. end;
  1160. { fold if there is base, index and offset, however, don't fold
  1161. for vfp memory instructions because we later fold the index }
  1162. if not((op in [A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1163. (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  1164. begin
  1165. if tmpreg1<>NR_NO then
  1166. begin
  1167. tmpreg2:=getintregister(list,OS_ADDR);
  1168. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg1,tmpreg2);
  1169. tmpreg1:=tmpreg2;
  1170. end
  1171. else
  1172. begin
  1173. tmpreg1:=getintregister(list,OS_ADDR);
  1174. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg1);
  1175. ref.base:=tmpreg1;
  1176. end;
  1177. ref.offset:=0;
  1178. end;
  1179. { floating point operations have only limited references
  1180. we expect here, that a base is already set }
  1181. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  1182. begin
  1183. if ref.shiftmode<>SM_none then
  1184. internalerror(200309121);
  1185. if tmpreg1<>NR_NO then
  1186. begin
  1187. if ref.base=tmpreg1 then
  1188. begin
  1189. if ref.signindex<0 then
  1190. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,tmpreg1,ref.index))
  1191. else
  1192. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,tmpreg1,ref.index));
  1193. ref.index:=NR_NO;
  1194. end
  1195. else
  1196. begin
  1197. if ref.index<>tmpreg1 then
  1198. internalerror(200403161);
  1199. if ref.signindex<0 then
  1200. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,ref.base,tmpreg1))
  1201. else
  1202. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,tmpreg1));
  1203. ref.base:=tmpreg1;
  1204. ref.index:=NR_NO;
  1205. end;
  1206. end
  1207. else
  1208. begin
  1209. tmpreg1:=getintregister(list,OS_ADDR);
  1210. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,ref.index));
  1211. ref.base:=tmpreg1;
  1212. ref.index:=NR_NO;
  1213. end;
  1214. end;
  1215. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  1216. Result := ref;
  1217. end;
  1218. procedure tbasecgarm.a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);
  1219. var
  1220. oppostfix:toppostfix;
  1221. usedtmpref: treference;
  1222. tmpreg : tregister;
  1223. dir : integer;
  1224. begin
  1225. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  1226. FromSize := ToSize;
  1227. case ToSize of
  1228. { signed integer registers }
  1229. OS_8,
  1230. OS_S8:
  1231. oppostfix:=PF_B;
  1232. OS_16,
  1233. OS_S16:
  1234. oppostfix:=PF_H;
  1235. OS_32,
  1236. OS_S32,
  1237. { for vfp value stored in integer register }
  1238. OS_F32:
  1239. oppostfix:=PF_None;
  1240. else
  1241. InternalError(2003082912);
  1242. end;
  1243. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[tosize])) or
  1244. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  1245. (oppostfix =PF_H)) then
  1246. begin
  1247. if target_info.endian=endian_big then
  1248. dir:=-1
  1249. else
  1250. dir:=1;
  1251. case FromSize of
  1252. OS_16,OS_S16:
  1253. begin
  1254. tmpreg:=getintregister(list,OS_INT);
  1255. usedtmpref:=ref;
  1256. if target_info.endian=endian_big then
  1257. inc(usedtmpref.offset,1);
  1258. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1259. inc(usedtmpref.offset,dir);
  1260. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1261. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1262. end;
  1263. OS_32,OS_S32:
  1264. begin
  1265. tmpreg:=getintregister(list,OS_INT);
  1266. usedtmpref:=ref;
  1267. if ref.alignment=2 then
  1268. begin
  1269. if target_info.endian=endian_big then
  1270. inc(usedtmpref.offset,2);
  1271. usedtmpref:=a_internal_load_reg_ref(list,OS_16,OS_16,reg,usedtmpref);
  1272. a_op_const_reg_reg(list,OP_SHR,OS_INT,16,reg,tmpreg);
  1273. inc(usedtmpref.offset,dir*2);
  1274. a_internal_load_reg_ref(list,OS_16,OS_16,tmpreg,usedtmpref);
  1275. end
  1276. else
  1277. begin
  1278. if target_info.endian=endian_big then
  1279. inc(usedtmpref.offset,3);
  1280. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1281. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1282. inc(usedtmpref.offset,dir);
  1283. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1284. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1285. inc(usedtmpref.offset,dir);
  1286. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1287. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1288. inc(usedtmpref.offset,dir);
  1289. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1290. end;
  1291. end
  1292. else
  1293. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1294. end;
  1295. end
  1296. else
  1297. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1298. end;
  1299. function tbasecgarm.a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  1300. var
  1301. oppostfix:toppostfix;
  1302. href: treference;
  1303. tmpreg: TRegister;
  1304. begin
  1305. case ToSize of
  1306. { signed integer registers }
  1307. OS_8,
  1308. OS_S8:
  1309. oppostfix:=PF_B;
  1310. OS_16,
  1311. OS_S16:
  1312. oppostfix:=PF_H;
  1313. OS_32,
  1314. OS_S32:
  1315. oppostfix:=PF_None;
  1316. else
  1317. InternalError(2003082910);
  1318. end;
  1319. if (tosize in [OS_S16,OS_16]) and
  1320. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1321. begin
  1322. result:=handle_load_store(list,A_STR,PF_B,reg,ref);
  1323. tmpreg:=getintregister(list,OS_INT);
  1324. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1325. href:=result;
  1326. inc(href.offset);
  1327. handle_load_store(list,A_STR,PF_B,tmpreg,href);
  1328. end
  1329. else
  1330. result:=handle_load_store(list,A_STR,oppostfix,reg,ref);
  1331. end;
  1332. function tbasecgarm.a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  1333. var
  1334. oppostfix:toppostfix;
  1335. so: tshifterop;
  1336. tmpreg: TRegister;
  1337. href: treference;
  1338. begin
  1339. case FromSize of
  1340. { signed integer registers }
  1341. OS_8:
  1342. oppostfix:=PF_B;
  1343. OS_S8:
  1344. oppostfix:=PF_SB;
  1345. OS_16:
  1346. oppostfix:=PF_H;
  1347. OS_S16:
  1348. oppostfix:=PF_SH;
  1349. OS_32,
  1350. OS_S32:
  1351. oppostfix:=PF_None;
  1352. else
  1353. InternalError(200308291);
  1354. end;
  1355. if (tosize=OS_S8) and
  1356. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1357. begin
  1358. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1359. a_load_reg_reg(list,OS_S8,OS_32,reg,reg);
  1360. end
  1361. else if (tosize in [OS_S16,OS_16]) and
  1362. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1363. begin
  1364. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1365. tmpreg:=getintregister(list,OS_INT);
  1366. href:=result;
  1367. inc(href.offset);
  1368. handle_load_store(list,A_LDR,PF_B,tmpreg,href);
  1369. shifterop_reset(so);
  1370. so.shiftmode:=SM_LSL;
  1371. so.shiftimm:=8;
  1372. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  1373. end
  1374. else
  1375. result:=handle_load_store(list,A_LDR,oppostfix,reg,ref);
  1376. end;
  1377. procedure tbasecgarm.a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);
  1378. var
  1379. so : tshifterop;
  1380. procedure do_shift(shiftmode : tshiftmode; shiftimm : byte; reg : tregister);
  1381. begin
  1382. if GenerateThumbCode then
  1383. begin
  1384. case shiftmode of
  1385. SM_ASR:
  1386. a_op_const_reg_reg(list,OP_SAR,OS_32,shiftimm,reg,reg2);
  1387. SM_LSR:
  1388. a_op_const_reg_reg(list,OP_SHR,OS_32,shiftimm,reg,reg2);
  1389. SM_LSL:
  1390. a_op_const_reg_reg(list,OP_SHL,OS_32,shiftimm,reg,reg2);
  1391. else
  1392. internalerror(2013090301);
  1393. end;
  1394. end
  1395. else
  1396. begin
  1397. so.shiftmode:=shiftmode;
  1398. so.shiftimm:=shiftimm;
  1399. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,reg2,reg,so));
  1400. end;
  1401. end;
  1402. var
  1403. instr: taicpu;
  1404. conv_done: boolean;
  1405. begin
  1406. if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then
  1407. internalerror(2002090901);
  1408. conv_done:=false;
  1409. if tosize<>fromsize then
  1410. begin
  1411. shifterop_reset(so);
  1412. conv_done:=true;
  1413. if tcgsize2size[tosize]<=tcgsize2size[fromsize] then
  1414. fromsize:=tosize;
  1415. if current_settings.cputype<cpu_armv6 then
  1416. case fromsize of
  1417. OS_8:
  1418. if GenerateThumbCode then
  1419. a_op_const_reg_reg(list,OP_AND,OS_32,$ff,reg1,reg2)
  1420. else
  1421. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1422. OS_S8:
  1423. begin
  1424. do_shift(SM_LSL,24,reg1);
  1425. if tosize=OS_16 then
  1426. begin
  1427. do_shift(SM_ASR,8,reg2);
  1428. do_shift(SM_LSR,16,reg2);
  1429. end
  1430. else
  1431. do_shift(SM_ASR,24,reg2);
  1432. end;
  1433. OS_16:
  1434. begin
  1435. do_shift(SM_LSL,16,reg1);
  1436. do_shift(SM_LSR,16,reg2);
  1437. end;
  1438. OS_S16:
  1439. begin
  1440. do_shift(SM_LSL,16,reg1);
  1441. do_shift(SM_ASR,16,reg2)
  1442. end;
  1443. else
  1444. conv_done:=false;
  1445. end
  1446. else
  1447. case fromsize of
  1448. OS_8:
  1449. if GenerateThumbCode then
  1450. list.concat(taicpu.op_reg_reg(A_UXTB,reg2,reg1))
  1451. else
  1452. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1453. OS_S8:
  1454. begin
  1455. if tosize=OS_16 then
  1456. begin
  1457. so.shiftmode:=SM_ROR;
  1458. so.shiftimm:=16;
  1459. list.concat(taicpu.op_reg_reg_shifterop(A_SXTB16,reg2,reg1,so));
  1460. do_shift(SM_LSR,16,reg2);
  1461. end
  1462. else
  1463. list.concat(taicpu.op_reg_reg(A_SXTB,reg2,reg1));
  1464. end;
  1465. OS_16:
  1466. list.concat(taicpu.op_reg_reg(A_UXTH,reg2,reg1));
  1467. OS_S16:
  1468. list.concat(taicpu.op_reg_reg(A_SXTH,reg2,reg1));
  1469. else
  1470. conv_done:=false;
  1471. end
  1472. end;
  1473. if not conv_done and (reg1<>reg2) then
  1474. begin
  1475. { same size, only a register mov required }
  1476. instr:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
  1477. list.Concat(instr);
  1478. { Notify the register allocator that we have written a move instruction so
  1479. it can try to eliminate it. }
  1480. add_move_instruction(instr);
  1481. end;
  1482. end;
  1483. procedure tbasecgarm.a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);
  1484. var
  1485. href,href2 : treference;
  1486. hloc : pcgparalocation;
  1487. begin
  1488. href:=ref;
  1489. hloc:=paraloc.location;
  1490. while assigned(hloc) do
  1491. begin
  1492. case hloc^.loc of
  1493. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  1494. begin
  1495. paramanager.allocparaloc(list,paraloc.location);
  1496. a_loadfpu_ref_reg(list,size,size,ref,hloc^.register);
  1497. end;
  1498. LOC_REGISTER :
  1499. case hloc^.size of
  1500. OS_32,
  1501. OS_F32:
  1502. begin
  1503. paramanager.allocparaloc(list,paraloc.location);
  1504. a_load_ref_reg(list,OS_32,OS_32,href,hloc^.register);
  1505. end;
  1506. OS_64,
  1507. OS_F64:
  1508. cg64.a_load64_ref_cgpara(list,href,paraloc);
  1509. else
  1510. a_load_ref_reg(list,hloc^.size,hloc^.size,href,hloc^.register);
  1511. end;
  1512. LOC_REFERENCE :
  1513. begin
  1514. reference_reset_base(href2,hloc^.reference.index,hloc^.reference.offset,ctempposinvalid,paraloc.alignment,[]);
  1515. { concatcopy should choose the best way to copy the data }
  1516. g_concatcopy(list,href,href2,tcgsize2size[hloc^.size]);
  1517. end;
  1518. else
  1519. internalerror(200408241);
  1520. end;
  1521. inc(href.offset,tcgsize2size[hloc^.size]);
  1522. hloc:=hloc^.next;
  1523. end;
  1524. end;
  1525. procedure tbasecgarm.a_loadfpu_reg_reg(list: TAsmList; fromsize,tosize: tcgsize; reg1, reg2: tregister);
  1526. begin
  1527. list.concat(setoppostfix(taicpu.op_reg_reg(A_MVF,reg2,reg1),cgsize2fpuoppostfix[tosize]));
  1528. end;
  1529. procedure tbasecgarm.a_loadfpu_ref_reg(list: TAsmList; fromsize,tosize: tcgsize; const ref: treference; reg: tregister);
  1530. var
  1531. oppostfix:toppostfix;
  1532. begin
  1533. case fromsize of
  1534. OS_32,
  1535. OS_F32:
  1536. oppostfix:=PF_S;
  1537. OS_64,
  1538. OS_F64:
  1539. oppostfix:=PF_D;
  1540. OS_F80:
  1541. oppostfix:=PF_E;
  1542. else
  1543. InternalError(200309021);
  1544. end;
  1545. handle_load_store(list,A_LDF,oppostfix,reg,ref);
  1546. if fromsize<>tosize then
  1547. a_loadfpu_reg_reg(list,fromsize,tosize,reg,reg);
  1548. end;
  1549. procedure tbasecgarm.a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);
  1550. var
  1551. oppostfix:toppostfix;
  1552. begin
  1553. case tosize of
  1554. OS_F32:
  1555. oppostfix:=PF_S;
  1556. OS_F64:
  1557. oppostfix:=PF_D;
  1558. OS_F80:
  1559. oppostfix:=PF_E;
  1560. else
  1561. InternalError(200309022);
  1562. end;
  1563. handle_load_store(list,A_STF,oppostfix,reg,ref);
  1564. end;
  1565. procedure tbasecgarm.g_check_for_fpu_exception(list: TAsmList;force,clear : boolean);
  1566. var
  1567. r : TRegister;
  1568. ai: taicpu;
  1569. l: TAsmLabel;
  1570. begin
  1571. if ((cs_check_fpu_exceptions in current_settings.localswitches) and
  1572. not(FPUARM_HAS_EXCEPTION_TRAPPING in fpu_capabilities[current_settings.fputype]) and
  1573. (force or current_procinfo.FPUExceptionCheckNeeded)) then
  1574. begin
  1575. r:=getintregister(list,OS_INT);
  1576. list.concat(taicpu.op_reg_reg(A_FMRX,r,NR_FPSCR));
  1577. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_AND,r,r,$9f),PF_S));
  1578. current_asmdata.getjumplabel(l);
  1579. ai:=taicpu.op_sym(A_B,l);
  1580. ai.is_jmp:=true;
  1581. ai.condition:=C_EQ;
  1582. list.concat(ai);
  1583. alloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  1584. cg.a_call_name(list,'FPC_THROWFPUEXCEPTION',false);
  1585. dealloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  1586. a_label(list,l);
  1587. if clear then
  1588. current_procinfo.FPUExceptionCheckNeeded:=false;
  1589. end;
  1590. end;
  1591. { comparison operations }
  1592. procedure tbasecgarm.a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  1593. l : tasmlabel);
  1594. var
  1595. tmpreg : tregister;
  1596. b : byte;
  1597. begin
  1598. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1599. if (not(GenerateThumbCode) and is_shifter_const(a,b)) or
  1600. ((GenerateThumbCode) and is_thumb_imm(a)) then
  1601. list.concat(taicpu.op_reg_const(A_CMP,reg,a))
  1602. { CMN reg,0 and CMN reg,$80000000 are different from CMP reg,$ffffffff
  1603. and CMP reg,$7fffffff regarding the flags according to the ARM manual }
  1604. else if (a<>$7fffffff) and (a<>-1) and not(GenerateThumbCode) and is_shifter_const(-a,b) then
  1605. list.concat(taicpu.op_reg_const(A_CMN,reg,-a))
  1606. else
  1607. begin
  1608. tmpreg:=getintregister(list,size);
  1609. a_load_const_reg(list,size,a,tmpreg);
  1610. list.concat(taicpu.op_reg_reg(A_CMP,reg,tmpreg));
  1611. end;
  1612. a_jmp_cond(list,cmp_op,l);
  1613. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1614. end;
  1615. procedure tbasecgarm.a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister);
  1616. begin
  1617. if reverse then
  1618. begin
  1619. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,src));
  1620. list.Concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,31));
  1621. list.Concat(taicpu.op_reg_reg_const(A_AND,dst,dst,255));
  1622. end
  1623. { it is decided during the compilation of the system unit if this code is used or not
  1624. so no additional check for rbit is needed }
  1625. else
  1626. begin
  1627. list.Concat(taicpu.op_reg_reg(A_RBIT,dst,src));
  1628. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,dst));
  1629. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1630. list.Concat(taicpu.op_reg_const(A_CMP,dst,32));
  1631. if GenerateThumb2Code then
  1632. list.Concat(taicpu.op_cond(A_IT, C_EQ));
  1633. list.Concat(setcondition(taicpu.op_reg_const(A_MOV,dst,$ff),C_EQ));
  1634. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1635. end;
  1636. end;
  1637. procedure tbasecgarm.a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel);
  1638. begin
  1639. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1640. list.concat(taicpu.op_reg_reg(A_CMP,reg2,reg1));
  1641. a_jmp_cond(list,cmp_op,l);
  1642. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1643. end;
  1644. procedure tbasecgarm.a_jmp_name(list : TAsmList;const s : string);
  1645. var
  1646. ai : taicpu;
  1647. begin
  1648. { generate far jump, leave it to the optimizer to get rid of it }
  1649. if GenerateThumbCode then
  1650. ai:=taicpu.op_sym(A_BL,current_asmdata.RefAsmSymbol(s,AT_FUNCTION))
  1651. else
  1652. ai:=taicpu.op_sym(A_B,current_asmdata.RefAsmSymbol(s,AT_FUNCTION));
  1653. ai.is_jmp:=true;
  1654. list.concat(ai);
  1655. end;
  1656. procedure tbasecgarm.a_jmp_always(list : TAsmList;l: tasmlabel);
  1657. var
  1658. ai : taicpu;
  1659. begin
  1660. { generate far jump, leave it to the optimizer to get rid of it }
  1661. if GenerateThumbCode then
  1662. ai:=taicpu.op_sym(A_BL,l)
  1663. else
  1664. ai:=taicpu.op_sym(A_B,l);
  1665. ai.is_jmp:=true;
  1666. list.concat(ai);
  1667. end;
  1668. procedure tbasecgarm.a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel);
  1669. var
  1670. ai : taicpu;
  1671. inv_flags : TResFlags;
  1672. hlabel : TAsmLabel;
  1673. begin
  1674. if GenerateThumbCode then
  1675. begin
  1676. inv_flags:=f;
  1677. inverse_flags(inv_flags);
  1678. { the optimizer has to fix this if jump range is sufficient short }
  1679. current_asmdata.getjumplabel(hlabel);
  1680. ai:=setcondition(taicpu.op_sym(A_B,hlabel),flags_to_cond(inv_flags));
  1681. ai.is_jmp:=true;
  1682. list.concat(ai);
  1683. a_jmp_always(list,l);
  1684. a_label(list,hlabel);
  1685. end
  1686. else
  1687. begin
  1688. ai:=setcondition(taicpu.op_sym(A_B,l),flags_to_cond(f));
  1689. ai.is_jmp:=true;
  1690. list.concat(ai);
  1691. end;
  1692. end;
  1693. procedure tbasecgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  1694. begin
  1695. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  1696. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  1697. end;
  1698. procedure tbasecgarm.g_profilecode(list : TAsmList);
  1699. begin
  1700. if target_info.system = system_arm_linux then
  1701. begin
  1702. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R14]));
  1703. a_call_name(list,'__gnu_mcount_nc',false);
  1704. end
  1705. else
  1706. internalerror(2014091201);
  1707. end;
  1708. procedure tbasecgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  1709. var
  1710. ref : treference;
  1711. shift : byte;
  1712. firstfloatreg,lastfloatreg,
  1713. r : byte;
  1714. mmregs,
  1715. regs, saveregs : tcpuregisterset;
  1716. registerarea,
  1717. r7offset,
  1718. stackmisalignment : pint;
  1719. imm1, imm2: DWord;
  1720. stack_parameters : Boolean;
  1721. begin
  1722. LocalSize:=align(LocalSize,4);
  1723. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  1724. { call instruction does not put anything on the stack }
  1725. registerarea:=0;
  1726. tcpuprocinfo(current_procinfo).stackpaddingreg:=High(TSuperRegister);
  1727. lastfloatreg:=RS_NO;
  1728. if not(nostackframe) then
  1729. begin
  1730. firstfloatreg:=RS_NO;
  1731. mmregs:=[];
  1732. case current_settings.fputype of
  1733. fpu_none,
  1734. fpu_soft,
  1735. fpu_libgcc:
  1736. ;
  1737. fpu_fpa,
  1738. fpu_fpa10,
  1739. fpu_fpa11:
  1740. begin
  1741. { save floating point registers? }
  1742. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1743. for r:=RS_F0 to RS_F7 do
  1744. if r in regs then
  1745. begin
  1746. if firstfloatreg=RS_NO then
  1747. firstfloatreg:=r;
  1748. lastfloatreg:=r;
  1749. inc(registerarea,12);
  1750. end;
  1751. end;
  1752. else if FPUARM_HAS_32REGS in fpu_capabilities[current_settings.fputype] then
  1753. begin;
  1754. { the *[0..31] is a hack to prevent that the compiler tries to save odd single-type registers,
  1755. they have numbers>$1f which is not really correct as they should simply have the same numbers
  1756. as the even ones by with a different subtype as it is done on x86 with al/ah }
  1757. mmregs:=(rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall))*[0..31];
  1758. end
  1759. else if FPUARM_HAS_VFP_EXTENSION in fpu_capabilities[current_settings.fputype] then
  1760. begin;
  1761. { the *[0..15] is a hack to prevent that the compiler tries to save odd single-type registers,
  1762. they have numbers>$1f which is not really correct as they should simply have the same numbers
  1763. as the even ones by with a different subtype as it is done on x86 with al/ah }
  1764. mmregs:=(rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall))*[0..15];
  1765. end
  1766. else
  1767. internalerror(2019050924);
  1768. end;
  1769. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1770. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1771. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  1772. { save int registers }
  1773. reference_reset(ref,4,[]);
  1774. ref.index:=NR_STACK_POINTER_REG;
  1775. ref.addressmode:=AM_PREINDEXED;
  1776. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  1777. if not(target_info.system in systems_darwin) then
  1778. begin
  1779. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1780. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1781. begin
  1782. a_reg_alloc(list,NR_R12);
  1783. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  1784. end;
  1785. { the (old) ARM APCS requires saving both the stack pointer (to
  1786. crawl the stack) and the PC (to identify the function this
  1787. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  1788. and R15 -- still needs updating for EABI and Darwin, they don't
  1789. need that }
  1790. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1791. regs:=regs+[RS_FRAME_POINTER_REG,RS_R12,RS_R14,RS_R15]
  1792. else
  1793. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1794. include(regs,RS_R14);
  1795. if regs<>[] then
  1796. begin
  1797. for r:=RS_R0 to RS_R15 do
  1798. if r in regs then
  1799. inc(registerarea,4);
  1800. { if the stack is not 8 byte aligned, try to add an extra register,
  1801. so we can avoid the extra sub/add ...,#4 later (KB) }
  1802. if ((registerarea mod current_settings.alignment.localalignmax) <> 0) then
  1803. for r:=RS_R3 downto RS_R0 do
  1804. if not(r in regs) then
  1805. begin
  1806. regs:=regs+[r];
  1807. inc(registerarea,4);
  1808. tcpuprocinfo(current_procinfo).stackpaddingreg:=r;
  1809. break;
  1810. end;
  1811. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  1812. end;
  1813. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1814. begin
  1815. { the framepointer now points to the saved R15, so the saved
  1816. framepointer is at R11-12 (for get_caller_frame) }
  1817. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  1818. a_reg_dealloc(list,NR_R12);
  1819. end;
  1820. end
  1821. else
  1822. begin
  1823. { always save r14 if we use r7 as the framepointer, because
  1824. the parameter offsets are hardcoded in advance and always
  1825. assume that r14 sits on the stack right behind the saved r7
  1826. }
  1827. if current_procinfo.framepointer=NR_FRAME_POINTER_REG then
  1828. include(regs,RS_FRAME_POINTER_REG);
  1829. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1830. include(regs,RS_R14);
  1831. if regs<>[] then
  1832. begin
  1833. { on Darwin, you first have to save [r4-r7,lr], and then
  1834. [r8,r10,r11] and make r7 point to the previously saved
  1835. r7 so that you can perform a stack crawl based on it
  1836. ([r7] is previous stack frame, [r7+4] is return address
  1837. }
  1838. include(regs,RS_FRAME_POINTER_REG);
  1839. saveregs:=regs-[RS_R8,RS_R10,RS_R11];
  1840. r7offset:=0;
  1841. for r:=RS_R0 to RS_R15 do
  1842. if r in saveregs then
  1843. begin
  1844. inc(registerarea,4);
  1845. if r<RS_FRAME_POINTER_REG then
  1846. inc(r7offset,4);
  1847. end;
  1848. { save the registers }
  1849. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1850. { make r7 point to the saved r7 (regardless of whether this
  1851. frame uses the framepointer, for backtrace purposes) }
  1852. if r7offset<>0 then
  1853. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_FRAME_POINTER_REG,NR_R13,r7offset))
  1854. else
  1855. list.concat(taicpu.op_reg_reg(A_MOV,NR_R7,NR_R13));
  1856. { now save the rest (if any) }
  1857. saveregs:=regs-saveregs;
  1858. if saveregs<>[] then
  1859. begin
  1860. for r:=RS_R8 to RS_R11 do
  1861. if r in saveregs then
  1862. inc(registerarea,4);
  1863. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1864. end;
  1865. end;
  1866. end;
  1867. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  1868. if (LocalSize<>0) or
  1869. ((stackmisalignment<>0) and
  1870. ((pi_do_call in current_procinfo.flags) or
  1871. (po_assembler in current_procinfo.procdef.procoptions))) then
  1872. begin
  1873. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  1874. if stack_parameters and (pi_estimatestacksize in current_procinfo.flags) then
  1875. begin
  1876. if localsize>tcpuprocinfo(current_procinfo).stackframesize then
  1877. internalerror(2014030901)
  1878. else
  1879. localsize:=tcpuprocinfo(current_procinfo).stackframesize-registerarea;
  1880. end;
  1881. if is_shifter_const(localsize,shift) then
  1882. begin
  1883. a_reg_dealloc(list,NR_R12);
  1884. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  1885. end
  1886. else if split_into_shifter_const(localsize, imm1, imm2) then
  1887. begin
  1888. a_reg_dealloc(list,NR_R12);
  1889. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  1890. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  1891. end
  1892. else
  1893. begin
  1894. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  1895. a_reg_alloc(list,NR_R12);
  1896. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  1897. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  1898. a_reg_dealloc(list,NR_R12);
  1899. end;
  1900. end;
  1901. if (mmregs<>[]) or
  1902. (firstfloatreg<>RS_NO) then
  1903. begin
  1904. reference_reset(ref,4,[]);
  1905. if (tg.direction*tcpuprocinfo(current_procinfo).floatregstart>=1023) or
  1906. (FPUARM_HAS_VFP_EXTENSION in fpu_capabilities[current_settings.fputype]) then
  1907. begin
  1908. if not is_shifter_const(tcpuprocinfo(current_procinfo).floatregstart,shift) then
  1909. begin
  1910. a_reg_alloc(list,NR_R12);
  1911. a_load_const_reg(list,OS_ADDR,-tcpuprocinfo(current_procinfo).floatregstart,NR_R12);
  1912. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1913. a_reg_dealloc(list,NR_R12);
  1914. end
  1915. else
  1916. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tcpuprocinfo(current_procinfo).floatregstart));
  1917. ref.base:=NR_R12;
  1918. end
  1919. else
  1920. begin
  1921. ref.base:=current_procinfo.framepointer;
  1922. ref.offset:=tcpuprocinfo(current_procinfo).floatregstart;
  1923. end;
  1924. case current_settings.fputype of
  1925. fpu_fpa,
  1926. fpu_fpa10,
  1927. fpu_fpa11:
  1928. begin
  1929. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  1930. lastfloatreg-firstfloatreg+1,ref));
  1931. end;
  1932. else if FPUARM_HAS_VFP_DOUBLE in fpu_capabilities[current_settings.fputype] then
  1933. begin
  1934. ref.index:=ref.base;
  1935. ref.base:=NR_NO;
  1936. if mmregs<>[] then
  1937. list.concat(taicpu.op_ref_regset(A_VSTM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  1938. end
  1939. else if FPUARM_HAS_VFP_EXTENSION in fpu_capabilities[current_settings.fputype] then
  1940. begin
  1941. ref.index:=ref.base;
  1942. ref.base:=NR_NO;
  1943. if mmregs<>[] then
  1944. list.concat(taicpu.op_ref_regset(A_VSTM,ref,R_MMREGISTER,R_SUBFS,mmregs));
  1945. end
  1946. else
  1947. internalerror(2019050923);
  1948. end;
  1949. end;
  1950. end;
  1951. end;
  1952. procedure tbasecgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  1953. var
  1954. ref : treference;
  1955. LocalSize : longint;
  1956. firstfloatreg,lastfloatreg,
  1957. r,
  1958. shift : byte;
  1959. mmregs,
  1960. saveregs,
  1961. regs : tcpuregisterset;
  1962. registerarea,
  1963. stackmisalignment: pint;
  1964. paddingreg: TSuperRegister;
  1965. imm1, imm2: DWord;
  1966. begin
  1967. if not(nostackframe) then
  1968. begin
  1969. registerarea:=0;
  1970. firstfloatreg:=RS_NO;
  1971. lastfloatreg:=RS_NO;
  1972. mmregs:=[];
  1973. saveregs:=[];
  1974. case current_settings.fputype of
  1975. fpu_none,
  1976. fpu_soft,
  1977. fpu_libgcc:
  1978. ;
  1979. fpu_fpa,
  1980. fpu_fpa10,
  1981. fpu_fpa11:
  1982. begin
  1983. { restore floating point registers? }
  1984. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1985. for r:=RS_F0 to RS_F7 do
  1986. if r in regs then
  1987. begin
  1988. if firstfloatreg=RS_NO then
  1989. firstfloatreg:=r;
  1990. lastfloatreg:=r;
  1991. { floating point register space is already included in
  1992. localsize below by calc_stackframe_size
  1993. inc(registerarea,12);
  1994. }
  1995. end;
  1996. end;
  1997. else if FPUARM_HAS_VFP_EXTENSION in fpu_capabilities[current_settings.fputype] then
  1998. begin
  1999. { restore vfp registers? }
  2000. { the *[0..31] is a hack to prevent that the compiler tries to save odd single-type registers,
  2001. they have numbers>$1f which is not really correct as they should simply have the same numbers
  2002. as the even ones by with a different subtype as it is done on x86 with al/ah }
  2003. mmregs:=(rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall))*[0..31];
  2004. end
  2005. else
  2006. internalerror(2019050908);
  2007. end;
  2008. if (firstfloatreg<>RS_NO) or
  2009. (mmregs<>[]) then
  2010. begin
  2011. reference_reset(ref,4,[]);
  2012. if (tg.direction*tcpuprocinfo(current_procinfo).floatregstart>=1023) or
  2013. (FPUARM_HAS_VFP_EXTENSION in fpu_capabilities[current_settings.fputype]) then
  2014. begin
  2015. if not is_shifter_const(tcpuprocinfo(current_procinfo).floatregstart,shift) then
  2016. begin
  2017. a_reg_alloc(list,NR_R12);
  2018. a_load_const_reg(list,OS_ADDR,-tcpuprocinfo(current_procinfo).floatregstart,NR_R12);
  2019. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  2020. a_reg_dealloc(list,NR_R12);
  2021. end
  2022. else
  2023. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tcpuprocinfo(current_procinfo).floatregstart));
  2024. ref.base:=NR_R12;
  2025. end
  2026. else
  2027. begin
  2028. ref.base:=current_procinfo.framepointer;
  2029. ref.offset:=tcpuprocinfo(current_procinfo).floatregstart;
  2030. end;
  2031. case current_settings.fputype of
  2032. fpu_fpa,
  2033. fpu_fpa10,
  2034. fpu_fpa11:
  2035. begin
  2036. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  2037. lastfloatreg-firstfloatreg+1,ref));
  2038. end;
  2039. else if FPUARM_HAS_VFP_DOUBLE in fpu_capabilities[current_settings.fputype] then
  2040. begin
  2041. ref.index:=ref.base;
  2042. ref.base:=NR_NO;
  2043. if mmregs<>[] then
  2044. list.concat(taicpu.op_ref_regset(A_VLDM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  2045. end
  2046. else if FPUARM_HAS_VFP_EXTENSION in fpu_capabilities[current_settings.fputype] then
  2047. begin
  2048. ref.index:=ref.base;
  2049. ref.base:=NR_NO;
  2050. if mmregs<>[] then
  2051. list.concat(taicpu.op_ref_regset(A_VLDM,ref,R_MMREGISTER,R_SUBFS,mmregs));
  2052. end
  2053. else
  2054. internalerror(2019050921);
  2055. end;
  2056. end;
  2057. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  2058. if (pi_do_call in current_procinfo.flags) or
  2059. (regs<>[]) or
  2060. ((target_info.system in systems_darwin) and
  2061. (current_procinfo.framepointer<>NR_STACK_POINTER_REG)) then
  2062. begin
  2063. exclude(regs,RS_R14);
  2064. include(regs,RS_R15);
  2065. if (target_info.system in systems_darwin) then
  2066. include(regs,RS_FRAME_POINTER_REG);
  2067. end;
  2068. if not(target_info.system in systems_darwin) then
  2069. begin
  2070. { restore saved stack pointer to SP (R13) and saved lr to PC (R15).
  2071. The saved PC came after that but is discarded, since we restore
  2072. the stack pointer }
  2073. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  2074. regs:=regs+[RS_FRAME_POINTER_REG,RS_R13,RS_R15];
  2075. end
  2076. else
  2077. begin
  2078. { restore R8-R11 already if necessary (they've been stored
  2079. before the others) }
  2080. saveregs:=regs*[RS_R8,RS_R10,RS_R11];
  2081. if saveregs<>[] then
  2082. begin
  2083. reference_reset(ref,4,[]);
  2084. ref.index:=NR_STACK_POINTER_REG;
  2085. ref.addressmode:=AM_PREINDEXED;
  2086. for r:=RS_R8 to RS_R11 do
  2087. if r in saveregs then
  2088. inc(registerarea,4);
  2089. regs:=regs-saveregs;
  2090. end;
  2091. end;
  2092. for r:=RS_R0 to RS_R15 do
  2093. if r in regs then
  2094. inc(registerarea,4);
  2095. { reapply the stack padding reg, in case there was one, see the complimentary
  2096. comment in g_proc_entry() (KB) }
  2097. paddingreg:=tcpuprocinfo(current_procinfo).stackpaddingreg;
  2098. if paddingreg < RS_R4 then
  2099. if paddingreg in regs then
  2100. internalerror(201306190)
  2101. else
  2102. begin
  2103. regs:=regs+[paddingreg];
  2104. inc(registerarea,4);
  2105. end;
  2106. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  2107. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  2108. (target_info.system in systems_darwin) then
  2109. begin
  2110. LocalSize:=current_procinfo.calc_stackframe_size;
  2111. if (LocalSize<>0) or
  2112. ((stackmisalignment<>0) and
  2113. ((pi_do_call in current_procinfo.flags) or
  2114. (po_assembler in current_procinfo.procdef.procoptions))) then
  2115. begin
  2116. if pi_estimatestacksize in current_procinfo.flags then
  2117. LocalSize:=tcpuprocinfo(current_procinfo).stackframesize-registerarea
  2118. else
  2119. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  2120. if is_shifter_const(LocalSize,shift) then
  2121. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  2122. else if split_into_shifter_const(localsize, imm1, imm2) then
  2123. begin
  2124. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  2125. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  2126. end
  2127. else
  2128. begin
  2129. a_reg_alloc(list,NR_R12);
  2130. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  2131. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  2132. a_reg_dealloc(list,NR_R12);
  2133. end;
  2134. end;
  2135. if (target_info.system in systems_darwin) and
  2136. (saveregs<>[]) then
  2137. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  2138. if regs=[] then
  2139. begin
  2140. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2141. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2142. else
  2143. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2144. end
  2145. else
  2146. begin
  2147. reference_reset(ref,4,[]);
  2148. ref.index:=NR_STACK_POINTER_REG;
  2149. ref.addressmode:=AM_PREINDEXED;
  2150. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  2151. end;
  2152. end
  2153. else
  2154. begin
  2155. { restore int registers and return }
  2156. reference_reset(ref,4,[]);
  2157. ref.index:=NR_FRAME_POINTER_REG;
  2158. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_EA));
  2159. end;
  2160. end
  2161. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2162. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2163. else
  2164. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2165. end;
  2166. procedure tbasecgarm.g_maybe_got_init(list : TAsmList);
  2167. var
  2168. ref : treference;
  2169. l : TAsmLabel;
  2170. regs : tcpuregisterset;
  2171. r: byte;
  2172. begin
  2173. if (cs_create_pic in current_settings.moduleswitches) and
  2174. (pi_needs_got in current_procinfo.flags) and
  2175. (tf_pic_uses_got in target_info.flags) then
  2176. begin
  2177. { Procedure parametrs are not initialized at this stage.
  2178. Before GOT initialization code, allocate registers used for procedure parameters
  2179. to prevent usage of these registers for temp operations in later stages of code
  2180. generation. }
  2181. regs:=rg[R_INTREGISTER].used_in_proc;
  2182. for r:=RS_R0 to RS_R3 do
  2183. if r in regs then
  2184. a_reg_alloc(list, newreg(R_INTREGISTER,r,R_SUBWHOLE));
  2185. { Allocate scratch register R12 and use it for GOT calculations directly.
  2186. Otherwise the init code can be distorted in later stages of code generation. }
  2187. a_reg_alloc(list,NR_R12);
  2188. reference_reset(ref,4,[]);
  2189. current_asmdata.getglobaldatalabel(l);
  2190. cg.a_label(current_procinfo.aktlocaldata,l);
  2191. ref.symbol:=l;
  2192. ref.base:=NR_PC;
  2193. ref.symboldata:=current_procinfo.aktlocaldata.last;
  2194. list.concat(Taicpu.op_reg_ref(A_LDR,NR_R12,ref));
  2195. current_asmdata.getaddrlabel(l);
  2196. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_32bit,l,current_asmdata.RefAsmSymbol('_GLOBAL_OFFSET_TABLE_',AT_DATA),-8));
  2197. cg.a_label(list,l);
  2198. list.concat(Taicpu.op_reg_reg_reg(A_ADD,NR_R12,NR_PC,NR_R12));
  2199. list.concat(Taicpu.op_reg_reg(A_MOV,current_procinfo.got,NR_R12));
  2200. { Deallocate registers }
  2201. a_reg_dealloc(list,NR_R12);
  2202. for r:=RS_R3 downto RS_R0 do
  2203. if r in regs then
  2204. a_reg_dealloc(list, newreg(R_INTREGISTER,r,R_SUBWHOLE));
  2205. end;
  2206. end;
  2207. procedure tbasecgarm.a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);
  2208. var
  2209. b : byte;
  2210. tmpref : treference;
  2211. instr : taicpu;
  2212. begin
  2213. if ref.addressmode<>AM_OFFSET then
  2214. internalerror(200309071);
  2215. tmpref:=ref;
  2216. { Be sure to have a base register }
  2217. if (tmpref.base=NR_NO) then
  2218. begin
  2219. if tmpref.shiftmode<>SM_None then
  2220. internalerror(2014020702);
  2221. if tmpref.signindex<0 then
  2222. internalerror(200312023);
  2223. tmpref.base:=tmpref.index;
  2224. tmpref.index:=NR_NO;
  2225. end;
  2226. if assigned(tmpref.symbol) or
  2227. not((is_shifter_const(tmpref.offset,b)) or
  2228. (is_shifter_const(-tmpref.offset,b))
  2229. ) then
  2230. fixref(list,tmpref);
  2231. { expect a base here if there is an index }
  2232. if (tmpref.base=NR_NO) and (tmpref.index<>NR_NO) then
  2233. internalerror(200312022);
  2234. if tmpref.index<>NR_NO then
  2235. begin
  2236. if tmpref.shiftmode<>SM_None then
  2237. internalerror(200312021);
  2238. if tmpref.signindex<0 then
  2239. a_op_reg_reg_reg(list,OP_SUB,OS_ADDR,tmpref.base,tmpref.index,r)
  2240. else
  2241. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpref.base,tmpref.index,r);
  2242. if tmpref.offset<>0 then
  2243. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,r,r);
  2244. end
  2245. else
  2246. begin
  2247. if tmpref.base=NR_NO then
  2248. a_load_const_reg(list,OS_ADDR,tmpref.offset,r)
  2249. else
  2250. if tmpref.offset<>0 then
  2251. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,tmpref.base,r)
  2252. else
  2253. begin
  2254. instr:=taicpu.op_reg_reg(A_MOV,r,tmpref.base);
  2255. list.concat(instr);
  2256. add_move_instruction(instr);
  2257. end;
  2258. end;
  2259. end;
  2260. procedure tbasecgarm.fixref(list : TAsmList;var ref : treference);
  2261. var
  2262. tmpreg, tmpreg2 : tregister;
  2263. tmpref : treference;
  2264. l, piclabel : tasmlabel;
  2265. indirection_done : boolean;
  2266. begin
  2267. { absolute symbols can't be handled directly, we've to store the symbol reference
  2268. in the text segment and access it pc relative
  2269. For now, we assume that references where base or index equals to PC are already
  2270. relative, all other references are assumed to be absolute and thus they need
  2271. to be handled extra.
  2272. A proper solution would be to change refoptions to a set and store the information
  2273. if the symbol is absolute or relative there.
  2274. }
  2275. { create consts entry }
  2276. reference_reset(tmpref,4,[]);
  2277. current_asmdata.getjumplabel(l);
  2278. cg.a_label(current_procinfo.aktlocaldata,l);
  2279. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  2280. piclabel:=nil;
  2281. tmpreg:=NR_NO;
  2282. indirection_done:=false;
  2283. if assigned(ref.symbol) then
  2284. begin
  2285. if (target_info.system=system_arm_ios) and
  2286. (ref.symbol.bind in [AB_EXTERNAL,AB_WEAK_EXTERNAL,AB_PRIVATE_EXTERN,AB_COMMON]) then
  2287. begin
  2288. tmpreg:=g_indirect_sym_load(list,ref.symbol.name,asmsym2indsymflags(ref.symbol));
  2289. if ref.offset<>0 then
  2290. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2291. indirection_done:=true;
  2292. end
  2293. else if ref.refaddr=addr_gottpoff then
  2294. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_gottpoff,ref.symbol,ref.relsymbol,ref.offset))
  2295. else if ref.refaddr=addr_tlsgd then
  2296. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_tlsgd,ref.symbol,ref.relsymbol,ref.offset))
  2297. else if ref.refaddr=addr_tlsdesc then
  2298. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_tlsdesc,ref.symbol,ref.relsymbol,ref.offset))
  2299. else if ref.refaddr=addr_tpoff then
  2300. begin
  2301. if assigned(ref.relsymbol) or (ref.offset<>0) then
  2302. Internalerror(2019092804);
  2303. current_procinfo.aktlocaldata.concat(tai_const.Create_type_sym(aitconst_tpoff,ref.symbol));
  2304. end
  2305. else if (cs_create_pic in current_settings.moduleswitches) then
  2306. if (tf_pic_uses_got in target_info.flags) then
  2307. current_procinfo.aktlocaldata.concat(tai_const.Create_type_sym(aitconst_got,ref.symbol))
  2308. else
  2309. begin
  2310. { ideally, we would want to generate
  2311. ldr r1, LPICConstPool
  2312. LPICLocal:
  2313. ldr/str r2,[pc,r1]
  2314. ...
  2315. LPICConstPool:
  2316. .long _globsym-(LPICLocal+8)
  2317. However, we cannot be sure that the ldr/str will follow
  2318. right after the call to fixref, so we have to load the
  2319. complete address already in a register.
  2320. }
  2321. current_asmdata.getaddrlabel(piclabel);
  2322. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_ptr,piclabel,ref.symbol,ref.offset-8));
  2323. end
  2324. else
  2325. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset))
  2326. end
  2327. else
  2328. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ref.offset));
  2329. { load consts entry }
  2330. if not indirection_done then
  2331. begin
  2332. tmpreg:=getintregister(list,OS_INT);
  2333. tmpref.symbol:=l;
  2334. tmpref.base:=NR_PC;
  2335. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2336. if (cs_create_pic in current_settings.moduleswitches) and
  2337. (tf_pic_uses_got in target_info.flags) and
  2338. assigned(ref.symbol) then
  2339. begin
  2340. {$ifdef EXTDEBUG}
  2341. if not (pi_needs_got in current_procinfo.flags) then
  2342. Comment(V_warning,'pi_needs_got not included');
  2343. {$endif EXTDEBUG}
  2344. Include(current_procinfo.flags,pi_needs_got);
  2345. reference_reset(tmpref,4,[]);
  2346. tmpref.base:=current_procinfo.got;
  2347. tmpref.index:=tmpreg;
  2348. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2349. if ref.offset<>0 then
  2350. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2351. end;
  2352. end;
  2353. if assigned(piclabel) then
  2354. begin
  2355. cg.a_label(list,piclabel);
  2356. tmpreg2:=getaddressregister(list);
  2357. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpreg,NR_PC,tmpreg2);
  2358. tmpreg:=tmpreg2
  2359. end;
  2360. { This routine can be called with PC as base/index in case the offset
  2361. was too large to encode in a load/store. In that case, the entire
  2362. absolute expression has been re-encoded in a new constpool entry, and
  2363. we have to remove the use of PC from the original reference (the code
  2364. above made everything relative to the value loaded from the new
  2365. constpool entry) }
  2366. if is_pc(ref.base) then
  2367. ref.base:=NR_NO;
  2368. if is_pc(ref.index) then
  2369. ref.index:=NR_NO;
  2370. if (ref.base<>NR_NO) then
  2371. begin
  2372. if ref.index<>NR_NO then
  2373. begin
  2374. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  2375. ref.base:=tmpreg;
  2376. end
  2377. else
  2378. if ref.base<>NR_PC then
  2379. begin
  2380. ref.index:=tmpreg;
  2381. ref.shiftimm:=0;
  2382. ref.signindex:=1;
  2383. ref.shiftmode:=SM_None;
  2384. end
  2385. else
  2386. ref.base:=tmpreg;
  2387. end
  2388. else
  2389. ref.base:=tmpreg;
  2390. ref.offset:=0;
  2391. ref.symbol:=nil;
  2392. end;
  2393. procedure tbasecgarm.g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  2394. var
  2395. paraloc1,paraloc2,paraloc3 : TCGPara;
  2396. pd : tprocdef;
  2397. begin
  2398. pd:=search_system_proc('MOVE');
  2399. paraloc1.init;
  2400. paraloc2.init;
  2401. paraloc3.init;
  2402. paramanager.getcgtempparaloc(list,pd,1,paraloc1);
  2403. paramanager.getcgtempparaloc(list,pd,2,paraloc2);
  2404. paramanager.getcgtempparaloc(list,pd,3,paraloc3);
  2405. a_load_const_cgpara(list,OS_SINT,len,paraloc3);
  2406. a_loadaddr_ref_cgpara(list,dest,paraloc2);
  2407. a_loadaddr_ref_cgpara(list,source,paraloc1);
  2408. paramanager.freecgpara(list,paraloc3);
  2409. paramanager.freecgpara(list,paraloc2);
  2410. paramanager.freecgpara(list,paraloc1);
  2411. alloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2412. alloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2413. a_call_name(list,'FPC_MOVE',false);
  2414. dealloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2415. dealloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2416. paraloc3.done;
  2417. paraloc2.done;
  2418. paraloc1.done;
  2419. end;
  2420. procedure tbasecgarm.g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  2421. const
  2422. maxtmpreg_arm = 10; {roozbeh: can be reduced to 8 or lower if might conflick with reserved ones,also +2 is used becouse of regs required for referencing}
  2423. maxtmpreg_thumb = 5;
  2424. var
  2425. srcref,dstref,usedtmpref,usedtmpref2:treference;
  2426. srcreg,destreg,countreg,r,tmpreg:tregister;
  2427. helpsize:aint;
  2428. copysize:byte;
  2429. cgsize:Tcgsize;
  2430. tmpregisters:array[1..maxtmpreg_arm] of tregister;
  2431. maxtmpreg,
  2432. tmpregi,tmpregi2:byte;
  2433. { will never be called with count<=4 }
  2434. procedure genloop(count : aword;size : byte);
  2435. const
  2436. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2437. var
  2438. l : tasmlabel;
  2439. begin
  2440. current_asmdata.getjumplabel(l);
  2441. if count<size then size:=1;
  2442. a_load_const_reg(list,OS_INT,count div size,countreg);
  2443. cg.a_label(list,l);
  2444. srcref.addressmode:=AM_POSTINDEXED;
  2445. dstref.addressmode:=AM_POSTINDEXED;
  2446. srcref.offset:=size;
  2447. dstref.offset:=size;
  2448. r:=getintregister(list,size2opsize[size]);
  2449. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2450. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2451. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1),PF_S));
  2452. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2453. a_jmp_flags(list,F_NE,l);
  2454. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2455. srcref.offset:=1;
  2456. dstref.offset:=1;
  2457. case count mod size of
  2458. 1:
  2459. begin
  2460. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2461. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2462. end;
  2463. 2:
  2464. if aligned then
  2465. begin
  2466. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2467. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2468. end
  2469. else
  2470. begin
  2471. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2472. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2473. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2474. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2475. end;
  2476. 3:
  2477. if aligned then
  2478. begin
  2479. srcref.offset:=2;
  2480. dstref.offset:=2;
  2481. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2482. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2483. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2484. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2485. end
  2486. else
  2487. begin
  2488. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2489. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2490. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2491. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2492. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2493. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2494. end;
  2495. end;
  2496. { keep the registers alive }
  2497. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2498. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2499. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2500. end;
  2501. { save estimation, if a creating a separate ref is needed or
  2502. if we can keep the original reference while copying }
  2503. function SimpleRef(const ref : treference) : boolean;
  2504. begin
  2505. result:=((ref.base=NR_PC) and (ref.addressmode=AM_OFFSET) and (ref.refaddr in [addr_full,addr_no])) or
  2506. ((ref.symbol=nil) and
  2507. (ref.addressmode=AM_OFFSET) and
  2508. (((ref.offset>=0) and (ref.offset+len<=31)) or
  2509. (not(GenerateThumbCode) and (ref.offset>=-255) and (ref.offset+len<=255)) or
  2510. { ldrh has a limited offset range }
  2511. (not(GenerateThumbCode) and ((len mod 4) in [0,1]) and (ref.offset>=-4095) and (ref.offset+len<=4095))
  2512. )
  2513. );
  2514. end;
  2515. { will never be called with count<=4 }
  2516. procedure genloop_thumb(count : aword;size : byte);
  2517. procedure refincofs(const ref : treference;const value : longint = 1);
  2518. begin
  2519. a_op_const_reg(list,OP_ADD,OS_ADDR,value,ref.base);
  2520. end;
  2521. const
  2522. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2523. var
  2524. l : tasmlabel;
  2525. begin
  2526. current_asmdata.getjumplabel(l);
  2527. if count<size then size:=1;
  2528. a_load_const_reg(list,OS_INT,count div size,countreg);
  2529. cg.a_label(list,l);
  2530. r:=getintregister(list,size2opsize[size]);
  2531. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2532. refincofs(srcref);
  2533. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2534. refincofs(dstref);
  2535. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2536. list.concat(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1));
  2537. a_jmp_flags(list,F_NE,l);
  2538. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2539. case count mod size of
  2540. 1:
  2541. begin
  2542. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2543. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2544. end;
  2545. 2:
  2546. if aligned then
  2547. begin
  2548. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2549. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2550. end
  2551. else
  2552. begin
  2553. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2554. refincofs(srcref);
  2555. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2556. refincofs(dstref);
  2557. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2558. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2559. end;
  2560. 3:
  2561. if aligned then
  2562. begin
  2563. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2564. refincofs(srcref,2);
  2565. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2566. refincofs(dstref,2);
  2567. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2568. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2569. end
  2570. else
  2571. begin
  2572. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2573. refincofs(srcref);
  2574. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2575. refincofs(dstref);
  2576. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2577. refincofs(srcref);
  2578. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2579. refincofs(dstref);
  2580. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2581. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2582. end;
  2583. end;
  2584. { keep the registers alive }
  2585. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2586. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2587. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2588. end;
  2589. begin
  2590. if len=0 then
  2591. exit;
  2592. if GenerateThumbCode then
  2593. maxtmpreg:=maxtmpreg_thumb
  2594. else
  2595. maxtmpreg:=maxtmpreg_arm;
  2596. helpsize:=12+maxtmpreg*4;//52 with maxtmpreg=10
  2597. dstref:=dest;
  2598. srcref:=source;
  2599. if cs_opt_size in current_settings.optimizerswitches then
  2600. helpsize:=8;
  2601. if aligned and (len=4) then
  2602. begin
  2603. tmpreg:=getintregister(list,OS_32);
  2604. a_load_ref_reg(list,OS_32,OS_32,source,tmpreg);
  2605. a_load_reg_ref(list,OS_32,OS_32,tmpreg,dest);
  2606. end
  2607. else if aligned and (len=2) then
  2608. begin
  2609. tmpreg:=getintregister(list,OS_16);
  2610. a_load_ref_reg(list,OS_16,OS_16,source,tmpreg);
  2611. a_load_reg_ref(list,OS_16,OS_16,tmpreg,dest);
  2612. end
  2613. else if (len<=helpsize) and aligned then
  2614. begin
  2615. tmpregi:=0;
  2616. { loading address in a separate register needed? }
  2617. if SimpleRef(source) then
  2618. begin
  2619. { ... then we don't need a loadaddr }
  2620. srcref:=source;
  2621. end
  2622. else
  2623. begin
  2624. srcreg:=getintregister(list,OS_ADDR);
  2625. a_loadaddr_ref_reg(list,source,srcreg);
  2626. reference_reset_base(srcref,srcreg,0,source.temppos,source.alignment,source.volatility);
  2627. end;
  2628. while (len div 4 <> 0) and (tmpregi<maxtmpreg) do
  2629. begin
  2630. inc(tmpregi);
  2631. tmpregisters[tmpregi]:=getintregister(list,OS_32);
  2632. a_load_ref_reg(list,OS_32,OS_32,srcref,tmpregisters[tmpregi]);
  2633. inc(srcref.offset,4);
  2634. dec(len,4);
  2635. end;
  2636. { loading address in a separate register needed? }
  2637. if SimpleRef(dest) then
  2638. dstref:=dest
  2639. else
  2640. begin
  2641. destreg:=getintregister(list,OS_ADDR);
  2642. a_loadaddr_ref_reg(list,dest,destreg);
  2643. reference_reset_base(dstref,destreg,0,dest.temppos,dest.alignment,dest.volatility);
  2644. end;
  2645. tmpregi2:=1;
  2646. while (tmpregi2<=tmpregi) do
  2647. begin
  2648. a_load_reg_ref(list,OS_32,OS_32,tmpregisters[tmpregi2],dstref);
  2649. inc(dstref.offset,4);
  2650. inc(tmpregi2);
  2651. end;
  2652. copysize:=4;
  2653. cgsize:=OS_32;
  2654. while len<>0 do
  2655. begin
  2656. if len<2 then
  2657. begin
  2658. copysize:=1;
  2659. cgsize:=OS_8;
  2660. end
  2661. else if len<4 then
  2662. begin
  2663. copysize:=2;
  2664. cgsize:=OS_16;
  2665. end;
  2666. dec(len,copysize);
  2667. r:=getintregister(list,cgsize);
  2668. a_load_ref_reg(list,cgsize,cgsize,srcref,r);
  2669. a_load_reg_ref(list,cgsize,cgsize,r,dstref);
  2670. inc(srcref.offset,copysize);
  2671. inc(dstref.offset,copysize);
  2672. end;{end of while}
  2673. end
  2674. else
  2675. begin
  2676. cgsize:=OS_32;
  2677. if (len<=4) then{len<=4 and not aligned}
  2678. begin
  2679. r:=getintregister(list,cgsize);
  2680. usedtmpref:=a_internal_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2681. if Len=1 then
  2682. a_load_reg_ref(list,OS_8,OS_8,r,dstref)
  2683. else
  2684. begin
  2685. tmpreg:=getintregister(list,cgsize);
  2686. usedtmpref2:=a_internal_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2687. inc(usedtmpref.offset,1);
  2688. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2689. inc(usedtmpref2.offset,1);
  2690. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2691. if len>2 then
  2692. begin
  2693. inc(usedtmpref.offset,1);
  2694. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2695. inc(usedtmpref2.offset,1);
  2696. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2697. if len>3 then
  2698. begin
  2699. inc(usedtmpref.offset,1);
  2700. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2701. inc(usedtmpref2.offset,1);
  2702. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2703. end;
  2704. end;
  2705. end;
  2706. end{end of if len<=4}
  2707. else
  2708. begin{unaligned & 4<len<helpsize **or** aligned/unaligned & len>helpsize}
  2709. destreg:=getintregister(list,OS_ADDR);
  2710. a_loadaddr_ref_reg(list,dest,destreg);
  2711. reference_reset_base(dstref,destreg,0,dest.temppos,dest.alignment,dest.volatility);
  2712. srcreg:=getintregister(list,OS_ADDR);
  2713. a_loadaddr_ref_reg(list,source,srcreg);
  2714. reference_reset_base(srcref,srcreg,0,dest.temppos,source.alignment,source.volatility);
  2715. countreg:=getintregister(list,OS_32);
  2716. // if cs_opt_size in current_settings.optimizerswitches then
  2717. { roozbeh : it seems loading 1 byte is faster becouse of caching/fetching(?) }
  2718. {if aligned then
  2719. genloop(len,4)
  2720. else}
  2721. if GenerateThumbCode then
  2722. genloop_thumb(len,1)
  2723. else
  2724. genloop(len,1);
  2725. end;
  2726. end;
  2727. end;
  2728. procedure tbasecgarm.g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);
  2729. begin
  2730. g_concatcopy_internal(list,source,dest,len,false);
  2731. end;
  2732. procedure tbasecgarm.g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);
  2733. begin
  2734. if (source.alignment in [1,3]) or
  2735. (dest.alignment in [1,3]) then
  2736. g_concatcopy_internal(list,source,dest,len,false)
  2737. else
  2738. g_concatcopy_internal(list,source,dest,len,true);
  2739. end;
  2740. procedure tbasecgarm.g_overflowCheck(list : TAsmList;const l : tlocation;def : tdef);
  2741. var
  2742. ovloc : tlocation;
  2743. begin
  2744. ovloc.loc:=LOC_VOID;
  2745. g_overflowCheck_loc(list,l,def,ovloc);
  2746. end;
  2747. procedure tbasecgarm.g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);
  2748. var
  2749. hl : tasmlabel;
  2750. ai:TAiCpu;
  2751. hflags : tresflags;
  2752. begin
  2753. if not(cs_check_overflow in current_settings.localswitches) then
  2754. exit;
  2755. current_asmdata.getjumplabel(hl);
  2756. case ovloc.loc of
  2757. LOC_VOID:
  2758. begin
  2759. ai:=taicpu.op_sym(A_B,hl);
  2760. ai.is_jmp:=true;
  2761. if not((def.typ=pointerdef) or
  2762. ((def.typ=orddef) and
  2763. (torddef(def).ordtype in [u64bit,u16bit,u32bit,u8bit,uchar,
  2764. pasbool1,pasbool8,pasbool16,pasbool32,pasbool64]))) then
  2765. ai.SetCondition(C_VC)
  2766. else
  2767. if TAiCpu(List.Last).opcode in [A_RSB,A_RSC,A_SBC,A_SUB] then
  2768. ai.SetCondition(C_CS)
  2769. else
  2770. ai.SetCondition(C_CC);
  2771. list.concat(ai);
  2772. end;
  2773. LOC_FLAGS:
  2774. begin
  2775. hflags:=ovloc.resflags;
  2776. inverse_flags(hflags);
  2777. cg.a_jmp_flags(list,hflags,hl);
  2778. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2779. end;
  2780. else
  2781. internalerror(200409281);
  2782. end;
  2783. a_call_name(list,'FPC_OVERFLOW',false);
  2784. a_label(list,hl);
  2785. end;
  2786. procedure tbasecgarm.g_save_registers(list : TAsmList);
  2787. begin
  2788. { this work is done in g_proc_entry }
  2789. end;
  2790. procedure tbasecgarm.g_restore_registers(list : TAsmList);
  2791. begin
  2792. { this work is done in g_proc_exit }
  2793. end;
  2794. procedure tbasecgarm.a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  2795. var
  2796. ai : taicpu;
  2797. hlabel : TAsmLabel;
  2798. begin
  2799. if GenerateThumbCode then
  2800. begin
  2801. { the optimizer has to fix this if jump range is sufficient short }
  2802. current_asmdata.getjumplabel(hlabel);
  2803. ai:=Taicpu.Op_sym(A_B,hlabel);
  2804. ai.SetCondition(inverse_cond(OpCmp2AsmCond[cond]));
  2805. ai.is_jmp:=true;
  2806. list.concat(ai);
  2807. a_jmp_always(list,l);
  2808. a_label(list,hlabel);
  2809. end
  2810. else
  2811. begin
  2812. ai:=Taicpu.Op_sym(A_B,l);
  2813. ai.SetCondition(OpCmp2AsmCond[cond]);
  2814. ai.is_jmp:=true;
  2815. list.concat(ai);
  2816. end;
  2817. end;
  2818. function get_scalar_mm_op(fromsize,tosize : tcgsize) : tasmop;
  2819. const
  2820. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of tasmop = (
  2821. (A_VMOV,A_VCVT,A_NONE,A_NONE,A_NONE),
  2822. (A_VCVT,A_VMOV,A_NONE,A_NONE,A_NONE),
  2823. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2824. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2825. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE));
  2826. begin
  2827. result:=convertop[fromsize,tosize];
  2828. if result=A_NONE then
  2829. internalerror(200312205);
  2830. end;
  2831. function get_scalar_mm_prefix(fromsize,tosize : tcgsize) : TOpPostfix;
  2832. const
  2833. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of TOpPostfix = (
  2834. (PF_F32, PF_F32F64,PF_None,PF_None,PF_None),
  2835. (PF_F64F32,PF_F64, PF_None,PF_None,PF_None),
  2836. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2837. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2838. (PF_None, PF_None, PF_None,PF_None,PF_None));
  2839. begin
  2840. result:=convertop[fromsize,tosize];
  2841. end;
  2842. procedure tbasecgarm.a_loadmm_reg_reg(list: tasmlist; fromsize,tosize: tcgsize; reg1,reg2: tregister; shuffle: pmmshuffle);
  2843. var
  2844. instr: taicpu;
  2845. begin
  2846. if (shuffle=nil) or shufflescalar(shuffle) then
  2847. instr:=setoppostfix(taicpu.op_reg_reg(get_scalar_mm_op(tosize,fromsize),reg2,reg1),get_scalar_mm_prefix(tosize,fromsize))
  2848. else
  2849. internalerror(2009112407);
  2850. list.concat(instr);
  2851. case instr.opcode of
  2852. A_VMOV:
  2853. { VMOV cannot generate an FPU exception, so we do not need a check here }
  2854. add_move_instruction(instr);
  2855. else
  2856. { VCVT can generate an exception }
  2857. maybe_check_for_fpu_exception(list);
  2858. end;
  2859. end;
  2860. procedure tbasecgarm.a_loadmm_ref_reg(list: tasmlist; fromsize,tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  2861. var
  2862. intreg,
  2863. tmpmmreg : tregister;
  2864. reg64 : tregister64;
  2865. begin
  2866. if assigned(shuffle) and
  2867. not(shufflescalar(shuffle)) then
  2868. internalerror(2009112413);
  2869. case fromsize of
  2870. OS_32,OS_S32:
  2871. begin
  2872. fromsize:=OS_F32;
  2873. { since we are loading an integer, no conversion may be required }
  2874. if (fromsize<>tosize) then
  2875. internalerror(2009112801);
  2876. end;
  2877. OS_64,OS_S64:
  2878. begin
  2879. fromsize:=OS_F64;
  2880. { since we are loading an integer, no conversion may be required }
  2881. if (fromsize<>tosize) then
  2882. internalerror(2009112901);
  2883. end;
  2884. OS_F32,OS_F64:
  2885. ;
  2886. else
  2887. internalerror(2019050920);
  2888. end;
  2889. if (fromsize<>tosize) then
  2890. tmpmmreg:=getmmregister(list,fromsize)
  2891. else
  2892. tmpmmreg:=reg;
  2893. if (ref.alignment in [1,2]) then
  2894. begin
  2895. case fromsize of
  2896. OS_F32:
  2897. begin
  2898. intreg:=getintregister(list,OS_32);
  2899. a_load_ref_reg(list,OS_32,OS_32,ref,intreg);
  2900. a_loadmm_intreg_reg(list,OS_32,OS_F32,intreg,tmpmmreg,mms_movescalar);
  2901. end;
  2902. OS_F64:
  2903. begin
  2904. reg64.reglo:=getintregister(list,OS_32);
  2905. reg64.reghi:=getintregister(list,OS_32);
  2906. cg64.a_load64_ref_reg(list,ref,reg64);
  2907. cg64.a_loadmm_intreg64_reg(list,OS_F64,reg64,tmpmmreg);
  2908. end;
  2909. else
  2910. internalerror(2009112412);
  2911. end;
  2912. end
  2913. else
  2914. handle_load_store(list,A_VLDR,PF_None,tmpmmreg,ref);
  2915. if (tmpmmreg<>reg) then
  2916. a_loadmm_reg_reg(list,fromsize,tosize,tmpmmreg,reg,shuffle);
  2917. end;
  2918. procedure tbasecgarm.a_loadmm_reg_ref(list: tasmlist; fromsize,tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  2919. var
  2920. intreg,
  2921. tmpmmreg : tregister;
  2922. reg64 : tregister64;
  2923. begin
  2924. if assigned(shuffle) and
  2925. not(shufflescalar(shuffle)) then
  2926. internalerror(2009112416);
  2927. case tosize of
  2928. OS_32,OS_S32:
  2929. begin
  2930. tosize:=OS_F32;
  2931. { since we are loading an integer, no conversion may be required }
  2932. if (fromsize<>tosize) then
  2933. internalerror(2009112802);
  2934. end;
  2935. OS_64,OS_S64:
  2936. begin
  2937. tosize:=OS_F64;
  2938. { since we are loading an integer, no conversion may be required }
  2939. if (fromsize<>tosize) then
  2940. internalerror(2009112902);
  2941. end;
  2942. OS_F32,OS_F64:
  2943. ;
  2944. else
  2945. internalerror(2019050919);
  2946. end;
  2947. if (fromsize<>tosize) then
  2948. begin
  2949. tmpmmreg:=getmmregister(list,tosize);
  2950. a_loadmm_reg_reg(list,fromsize,tosize,reg,tmpmmreg,shuffle);
  2951. end
  2952. else
  2953. tmpmmreg:=reg;
  2954. if (ref.alignment in [1,2]) then
  2955. begin
  2956. case tosize of
  2957. OS_F32:
  2958. begin
  2959. intreg:=getintregister(list,OS_32);
  2960. a_loadmm_reg_intreg(list,OS_F32,OS_32,tmpmmreg,intreg,shuffle);
  2961. a_load_reg_ref(list,OS_32,OS_32,intreg,ref);
  2962. end;
  2963. OS_F64:
  2964. begin
  2965. reg64.reglo:=getintregister(list,OS_32);
  2966. reg64.reghi:=getintregister(list,OS_32);
  2967. cg64.a_loadmm_reg_intreg64(list,OS_F64,tmpmmreg,reg64);
  2968. cg64.a_load64_reg_ref(list,reg64,ref);
  2969. end;
  2970. else
  2971. internalerror(2009112417);
  2972. end;
  2973. end
  2974. else
  2975. handle_load_store(list,A_VSTR,PF_None,tmpmmreg,ref);
  2976. { VSTR cannot generate an FPU exception, VCVT is handled seperately, so we do not need a check here }
  2977. end;
  2978. procedure tbasecgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  2979. begin
  2980. { this code can only be used to transfer raw data, not to perform
  2981. conversions }
  2982. if (tosize<>OS_F32) then
  2983. internalerror(2009112419);
  2984. if not(fromsize in [OS_32,OS_S32]) then
  2985. internalerror(2009112420);
  2986. if assigned(shuffle) and
  2987. not shufflescalar(shuffle) then
  2988. internalerror(2009112516);
  2989. list.concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg));
  2990. { VMOV cannot generate an FPU exception, so we do not need a check here }
  2991. end;
  2992. procedure tbasecgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize; mmreg, intreg: tregister;shuffle : pmmshuffle);
  2993. begin
  2994. { this code can only be used to transfer raw data, not to perform
  2995. conversions }
  2996. if (fromsize<>OS_F32) then
  2997. internalerror(2009112430);
  2998. if not(tosize in [OS_32,OS_S32]) then
  2999. internalerror(2009112409);
  3000. if assigned(shuffle) and
  3001. not shufflescalar(shuffle) then
  3002. internalerror(2009112514);
  3003. list.concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg));
  3004. { VMOV cannot generate an FPU exception, so we do not need a check here }
  3005. end;
  3006. procedure tbasecgarm.a_opmm_reg_reg(list: tasmlist; op: topcg; size: tcgsize; src, dst: tregister; shuffle: pmmshuffle);
  3007. var
  3008. tmpreg: tregister;
  3009. begin
  3010. { the vfp doesn't support xor nor any other logical operation, but
  3011. this routine is used to initialise global mm regvars. We can
  3012. easily initialise an mm reg with 0 though. }
  3013. case op of
  3014. OP_XOR:
  3015. begin
  3016. if (FPUARM_HAS_NEON in fpu_capabilities[current_settings.fputype]) and (size in [OS_F64]) then
  3017. begin
  3018. if (reg_cgsize(src)<>size) or
  3019. assigned(shuffle) then
  3020. internalerror(2019081301);
  3021. list.concat(taicpu.op_reg_reg_reg(A_VEOR,dst,dst,src));
  3022. end
  3023. else
  3024. begin
  3025. if (src<>dst) or
  3026. (reg_cgsize(src)<>size) or
  3027. assigned(shuffle) then
  3028. internalerror(2009112907);
  3029. tmpreg:=getintregister(list,OS_32);
  3030. a_load_const_reg(list,OS_32,0,tmpreg);
  3031. case size of
  3032. OS_F32:
  3033. list.concat(taicpu.op_reg_reg(A_VMOV,dst,tmpreg));
  3034. OS_F64:
  3035. list.concat(taicpu.op_reg_reg_reg(A_VMOV,dst,tmpreg,tmpreg));
  3036. else
  3037. internalerror(2009112908);
  3038. end;
  3039. end;
  3040. end
  3041. else
  3042. internalerror(2009112906);
  3043. end;
  3044. end;
  3045. procedure tbasecgarm.maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  3046. const
  3047. overflowops = [OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NEG];
  3048. begin
  3049. if (op in overflowops) and
  3050. (size in [OS_8,OS_S8,OS_16,OS_S16]) then
  3051. a_load_reg_reg(list,OS_32,size,dst,dst);
  3052. end;
  3053. procedure tbasecgarm.safe_mla(list : TAsmList; op1,op2,op3,op4 : TRegister);
  3054. procedure checkreg(var reg : TRegister);
  3055. var
  3056. tmpreg : TRegister;
  3057. begin
  3058. if ((GenerateThumbCode or GenerateThumb2Code) and (getsupreg(reg)=RS_R13)) or
  3059. (getsupreg(reg)=RS_R15) then
  3060. begin
  3061. tmpreg:=getintregister(list,OS_INT);
  3062. a_load_reg_reg(list,OS_INT,OS_INT,reg,tmpreg);
  3063. reg:=tmpreg;
  3064. end;
  3065. end;
  3066. begin
  3067. checkreg(op1);
  3068. checkreg(op2);
  3069. checkreg(op3);
  3070. checkreg(op4);
  3071. list.concat(taicpu.op_reg_reg_reg_reg(A_MLA,op1,op2,op3,op4));
  3072. end;
  3073. procedure tbasecgarm.g_maybe_tls_init(list : TAsmList);
  3074. begin
  3075. if pi_needs_tls in current_procinfo.flags then
  3076. begin
  3077. list.concat(tai_regalloc.alloc(NR_R0,nil));
  3078. a_call_name(list,'fpc_read_tp',false);
  3079. a_load_reg_reg(list,OS_ADDR,OS_ADDR,NR_R0,current_procinfo.tlsoffset);
  3080. list.concat(tai_regalloc.dealloc(NR_R0,nil));
  3081. end;
  3082. end;
  3083. procedure tcg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  3084. begin
  3085. case op of
  3086. OP_NEG:
  3087. begin
  3088. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3089. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  3090. list.concat(taicpu.op_reg_reg_const(A_RSC,regdst.reghi,regsrc.reghi,0));
  3091. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3092. end;
  3093. OP_NOT:
  3094. begin
  3095. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  3096. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  3097. end;
  3098. else
  3099. a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);
  3100. end;
  3101. end;
  3102. procedure tcg64farm.a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);
  3103. begin
  3104. a_op64_const_reg_reg(list,op,size,value,reg,reg);
  3105. end;
  3106. procedure tcg64farm.a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);
  3107. var
  3108. ovloc : tlocation;
  3109. begin
  3110. a_op64_const_reg_reg_checkoverflow(list,op,size,value,regsrc,regdst,false,ovloc);
  3111. end;
  3112. procedure tcg64farm.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);
  3113. var
  3114. ovloc : tlocation;
  3115. begin
  3116. a_op64_reg_reg_reg_checkoverflow(list,op,size,regsrc1,regsrc2,regdst,false,ovloc);
  3117. end;
  3118. procedure tcg64farm.a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);
  3119. begin
  3120. { this code can only be used to transfer raw data, not to perform
  3121. conversions }
  3122. if (mmsize<>OS_F64) then
  3123. internalerror(2009112405);
  3124. list.concat(taicpu.op_reg_reg_reg(A_VMOV,mmreg,intreg.reglo,intreg.reghi));
  3125. { VMOV cannot generate an FPU exception, so we do not need a check here }
  3126. end;
  3127. procedure tcg64farm.a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);
  3128. begin
  3129. { this code can only be used to transfer raw data, not to perform
  3130. conversions }
  3131. if (mmsize<>OS_F64) then
  3132. internalerror(2009112406);
  3133. list.concat(taicpu.op_reg_reg_reg(A_VMOV,intreg.reglo,intreg.reghi,mmreg));
  3134. { VMOV cannot generate an FPU exception, so we do not need a check here }
  3135. end;
  3136. procedure tcg64farm.a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3137. var
  3138. tmpreg : tregister;
  3139. b : byte;
  3140. begin
  3141. ovloc.loc:=LOC_VOID;
  3142. case op of
  3143. OP_NEG,
  3144. OP_NOT :
  3145. internalerror(2012022501);
  3146. else
  3147. ;
  3148. end;
  3149. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3150. begin
  3151. case op of
  3152. OP_ADD:
  3153. begin
  3154. if is_shifter_const(lo(value),b) then
  3155. begin
  3156. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3157. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3158. end
  3159. else
  3160. begin
  3161. tmpreg:=cg.getintregister(list,OS_32);
  3162. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3163. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3164. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3165. end;
  3166. if is_shifter_const(hi(value),b) then
  3167. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,hi(value)),PF_S))
  3168. else
  3169. begin
  3170. tmpreg:=cg.getintregister(list,OS_32);
  3171. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3172. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3173. end;
  3174. end;
  3175. OP_SUB:
  3176. begin
  3177. if is_shifter_const(lo(value),b) then
  3178. begin
  3179. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3180. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3181. end
  3182. else
  3183. begin
  3184. tmpreg:=cg.getintregister(list,OS_32);
  3185. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3186. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3187. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3188. end;
  3189. if is_shifter_const(hi(value),b) then
  3190. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))),PF_S))
  3191. else
  3192. begin
  3193. tmpreg:=cg.getintregister(list,OS_32);
  3194. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3195. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3196. end;
  3197. end;
  3198. else
  3199. internalerror(200502131);
  3200. end;
  3201. if size=OS_64 then
  3202. begin
  3203. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3204. ovloc.loc:=LOC_FLAGS;
  3205. case op of
  3206. OP_ADD:
  3207. ovloc.resflags:=F_CS;
  3208. OP_SUB:
  3209. ovloc.resflags:=F_CC;
  3210. else
  3211. internalerror(2019050918);
  3212. end;
  3213. end;
  3214. end
  3215. else
  3216. begin
  3217. case op of
  3218. OP_AND,OP_OR,OP_XOR:
  3219. begin
  3220. cg.a_op_const_reg_reg(list,op,OS_32,aint(lo(value)),regsrc.reglo,regdst.reglo);
  3221. cg.a_op_const_reg_reg(list,op,OS_32,aint(hi(value)),regsrc.reghi,regdst.reghi);
  3222. end;
  3223. OP_ADD:
  3224. begin
  3225. if is_shifter_const(aint(lo(value)),b) then
  3226. begin
  3227. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3228. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3229. end
  3230. else
  3231. begin
  3232. tmpreg:=cg.getintregister(list,OS_32);
  3233. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3234. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3235. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3236. end;
  3237. if is_shifter_const(aint(hi(value)),b) then
  3238. list.concat(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3239. else
  3240. begin
  3241. tmpreg:=cg.getintregister(list,OS_32);
  3242. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  3243. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg));
  3244. end;
  3245. end;
  3246. OP_SUB:
  3247. begin
  3248. if is_shifter_const(aint(lo(value)),b) then
  3249. begin
  3250. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3251. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3252. end
  3253. else
  3254. begin
  3255. tmpreg:=cg.getintregister(list,OS_32);
  3256. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3257. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3258. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3259. end;
  3260. if is_shifter_const(aint(hi(value)),b) then
  3261. list.concat(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3262. else
  3263. begin
  3264. tmpreg:=cg.getintregister(list,OS_32);
  3265. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3266. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg));
  3267. end;
  3268. end;
  3269. else
  3270. internalerror(2003083101);
  3271. end;
  3272. end;
  3273. end;
  3274. procedure tcg64farm.a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3275. begin
  3276. ovloc.loc:=LOC_VOID;
  3277. case op of
  3278. OP_NEG,
  3279. OP_NOT :
  3280. internalerror(2012022502);
  3281. else
  3282. ;
  3283. end;
  3284. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3285. begin
  3286. case op of
  3287. OP_ADD:
  3288. begin
  3289. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3290. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3291. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi),PF_S));
  3292. end;
  3293. OP_SUB:
  3294. begin
  3295. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3296. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3297. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi),PF_S));
  3298. end;
  3299. else
  3300. internalerror(2003083102);
  3301. end;
  3302. if size=OS_64 then
  3303. begin
  3304. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3305. ovloc.loc:=LOC_FLAGS;
  3306. case op of
  3307. OP_ADD:
  3308. ovloc.resflags:=F_CS;
  3309. OP_SUB:
  3310. ovloc.resflags:=F_CC;
  3311. else
  3312. internalerror(2019050917);
  3313. end;
  3314. end;
  3315. end
  3316. else
  3317. begin
  3318. case op of
  3319. OP_AND,OP_OR,OP_XOR:
  3320. begin
  3321. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);
  3322. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);
  3323. end;
  3324. OP_ADD:
  3325. begin
  3326. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3327. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3328. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi));
  3329. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3330. end;
  3331. OP_SUB:
  3332. begin
  3333. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3334. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3335. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi));
  3336. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3337. end;
  3338. else
  3339. internalerror(2003083104);
  3340. end;
  3341. end;
  3342. end;
  3343. procedure tthumbcgarm.init_register_allocators;
  3344. begin
  3345. inherited init_register_allocators;
  3346. if assigned(current_procinfo) and (current_procinfo.framepointer=NR_R7) then
  3347. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3348. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6],first_int_imreg,[])
  3349. else
  3350. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3351. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7],first_int_imreg,[]);
  3352. end;
  3353. procedure tthumbcgarm.done_register_allocators;
  3354. begin
  3355. rg[R_INTREGISTER].free;
  3356. rg[R_FPUREGISTER].free;
  3357. rg[R_MMREGISTER].free;
  3358. inherited done_register_allocators;
  3359. end;
  3360. procedure tthumbcgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  3361. var
  3362. ref : treference;
  3363. r : byte;
  3364. regs : tcpuregisterset;
  3365. stackmisalignment : pint;
  3366. registerarea: DWord;
  3367. stack_parameters: Boolean;
  3368. begin
  3369. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3370. LocalSize:=align(LocalSize,4);
  3371. { call instruction does not put anything on the stack }
  3372. stackmisalignment:=0;
  3373. if not(nostackframe) then
  3374. begin
  3375. a_reg_alloc(list,NR_STACK_POINTER_REG);
  3376. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3377. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  3378. { save int registers }
  3379. reference_reset(ref,4,[]);
  3380. ref.index:=NR_STACK_POINTER_REG;
  3381. ref.addressmode:=AM_PREINDEXED;
  3382. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3383. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3384. begin
  3385. //!!!! a_reg_alloc(list,NR_R12);
  3386. //!!!! list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  3387. end;
  3388. { the (old) ARM APCS requires saving both the stack pointer (to
  3389. crawl the stack) and the PC (to identify the function this
  3390. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  3391. and R15 -- still needs updating for EABI and Darwin, they don't
  3392. need that }
  3393. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3394. regs:=regs+[RS_R7,RS_R14]
  3395. else
  3396. // if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  3397. include(regs,RS_R14);
  3398. { safely estimate stack size }
  3399. if localsize+current_settings.alignment.localalignmax+4>508 then
  3400. begin
  3401. include(rg[R_INTREGISTER].used_in_proc,RS_R4);
  3402. include(regs,RS_R4);
  3403. end;
  3404. registerarea:=0;
  3405. if regs<>[] then
  3406. begin
  3407. for r:=RS_R0 to RS_R15 do
  3408. if r in regs then
  3409. inc(registerarea,4);
  3410. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,regs));
  3411. { we need to run the loop twice to get cfi right }
  3412. registerarea:=0;
  3413. for r:=RS_R0 to RS_R15 do
  3414. if r in regs then
  3415. begin
  3416. inc(registerarea,4);
  3417. current_asmdata.asmcfi.cfa_offset(list,newreg(R_INTREGISTER,r,R_SUBWHOLE),-registerarea);
  3418. end;
  3419. current_asmdata.asmcfi.cfa_def_cfa_offset(list,registerarea);
  3420. end;
  3421. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3422. if stack_parameters or (LocalSize<>0) or
  3423. ((stackmisalignment<>0) and
  3424. ((pi_do_call in current_procinfo.flags) or
  3425. (po_assembler in current_procinfo.procdef.procoptions))) then
  3426. begin
  3427. { do we access stack parameters?
  3428. if yes, the previously estimated stacksize must be used }
  3429. if stack_parameters then
  3430. begin
  3431. if localsize>tcpuprocinfo(current_procinfo).stackframesize then
  3432. begin
  3433. writeln(localsize);
  3434. writeln(tcpuprocinfo(current_procinfo).stackframesize);
  3435. internalerror(2013040601);
  3436. end
  3437. else
  3438. localsize:=tcpuprocinfo(current_procinfo).stackframesize-registerarea;
  3439. end
  3440. else
  3441. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3442. if localsize<508 then
  3443. begin
  3444. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  3445. end
  3446. else if localsize<=1016 then
  3447. begin
  3448. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3449. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize-508));
  3450. end
  3451. else
  3452. begin
  3453. a_load_const_reg(list,OS_ADDR,-localsize,NR_R4);
  3454. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R4));
  3455. include(regs,RS_R4);
  3456. end;
  3457. current_asmdata.asmcfi.cfa_def_cfa_offset(list,registerarea+localsize);
  3458. end;
  3459. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3460. begin
  3461. list.concat(taicpu.op_reg_reg_const(A_ADD,current_procinfo.framepointer,NR_STACK_POINTER_REG,0));
  3462. current_asmdata.asmcfi.cfa_def_cfa_register(list,current_procinfo.framepointer);
  3463. end;
  3464. end;
  3465. end;
  3466. procedure tthumbcgarm.g_proc_exit(list: TAsmList; parasize: longint; nostackframe: boolean);
  3467. var
  3468. LocalSize : longint;
  3469. r: byte;
  3470. regs : tcpuregisterset;
  3471. registerarea : DWord;
  3472. stackmisalignment: pint;
  3473. stack_parameters : Boolean;
  3474. begin
  3475. if not(nostackframe) then
  3476. begin
  3477. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3478. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3479. include(regs,RS_R15);
  3480. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3481. include(regs,getsupreg(current_procinfo.framepointer));
  3482. registerarea:=0;
  3483. for r:=RS_R0 to RS_R15 do
  3484. if r in regs then
  3485. inc(registerarea,4);
  3486. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3487. LocalSize:=current_procinfo.calc_stackframe_size;
  3488. if stack_parameters then
  3489. localsize:=tcpuprocinfo(current_procinfo).stackframesize-registerarea
  3490. else
  3491. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3492. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  3493. (target_info.system in systems_darwin) then
  3494. begin
  3495. if (LocalSize<>0) or
  3496. ((stackmisalignment<>0) and
  3497. ((pi_do_call in current_procinfo.flags) or
  3498. (po_assembler in current_procinfo.procdef.procoptions))) then
  3499. begin
  3500. if LocalSize=0 then
  3501. else if LocalSize<=508 then
  3502. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  3503. else if LocalSize<=1016 then
  3504. begin
  3505. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3506. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,localsize-508));
  3507. end
  3508. else
  3509. begin
  3510. a_reg_alloc(list,NR_R3);
  3511. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R3);
  3512. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R3));
  3513. a_reg_dealloc(list,NR_R3);
  3514. end;
  3515. end;
  3516. if regs=[] then
  3517. begin
  3518. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3519. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3520. else
  3521. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3522. end
  3523. else
  3524. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,regs));
  3525. end;
  3526. end
  3527. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3528. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3529. else
  3530. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3531. end;
  3532. procedure tthumbcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3533. var
  3534. oppostfix:toppostfix;
  3535. usedtmpref: treference;
  3536. tmpreg,tmpreg2 : tregister;
  3537. dir : integer;
  3538. begin
  3539. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3540. FromSize := ToSize;
  3541. case FromSize of
  3542. { signed integer registers }
  3543. OS_8:
  3544. oppostfix:=PF_B;
  3545. OS_S8:
  3546. oppostfix:=PF_SB;
  3547. OS_16:
  3548. oppostfix:=PF_H;
  3549. OS_S16:
  3550. oppostfix:=PF_SH;
  3551. OS_32,
  3552. OS_S32:
  3553. oppostfix:=PF_None;
  3554. else
  3555. InternalError(200308298);
  3556. end;
  3557. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3558. begin
  3559. if target_info.endian=endian_big then
  3560. dir:=-1
  3561. else
  3562. dir:=1;
  3563. case FromSize of
  3564. OS_16,OS_S16:
  3565. begin
  3566. { only complicated references need an extra loadaddr }
  3567. if assigned(ref.symbol) or
  3568. (ref.index<>NR_NO) or
  3569. (ref.offset<-124) or
  3570. (ref.offset>124) or
  3571. { sometimes the compiler reused registers }
  3572. (reg=ref.index) or
  3573. (reg=ref.base) then
  3574. begin
  3575. tmpreg2:=getintregister(list,OS_INT);
  3576. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3577. reference_reset_base(usedtmpref,tmpreg2,0,ref.temppos,ref.alignment,ref.volatility);
  3578. end
  3579. else
  3580. usedtmpref:=ref;
  3581. if target_info.endian=endian_big then
  3582. inc(usedtmpref.offset,1);
  3583. tmpreg:=getintregister(list,OS_INT);
  3584. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3585. inc(usedtmpref.offset,dir);
  3586. if FromSize=OS_16 then
  3587. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3588. else
  3589. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3590. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3591. list.concat(setoppostfix(taicpu.op_reg_reg(A_ORR,reg,tmpreg),PF_S));
  3592. end;
  3593. OS_32,OS_S32:
  3594. begin
  3595. tmpreg:=getintregister(list,OS_INT);
  3596. { only complicated references need an extra loadaddr }
  3597. if assigned(ref.symbol) or
  3598. (ref.index<>NR_NO) or
  3599. (ref.offset<-124) or
  3600. (ref.offset>124) or
  3601. { sometimes the compiler reused registers }
  3602. (reg=ref.index) or
  3603. (reg=ref.base) then
  3604. begin
  3605. tmpreg2:=getintregister(list,OS_INT);
  3606. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3607. reference_reset_base(usedtmpref,tmpreg2,0,ref.temppos,ref.alignment,ref.volatility);
  3608. end
  3609. else
  3610. usedtmpref:=ref;
  3611. if ref.alignment=2 then
  3612. begin
  3613. if target_info.endian=endian_big then
  3614. inc(usedtmpref.offset,2);
  3615. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  3616. inc(usedtmpref.offset,dir*2);
  3617. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  3618. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3619. list.concat(setoppostfix(taicpu.op_reg_reg(A_ORR,reg,tmpreg),PF_S));
  3620. end
  3621. else
  3622. begin
  3623. if target_info.endian=endian_big then
  3624. inc(usedtmpref.offset,3);
  3625. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3626. inc(usedtmpref.offset,dir);
  3627. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3628. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3629. list.concat(setoppostfix(taicpu.op_reg_reg(A_ORR,reg,tmpreg),PF_S));
  3630. inc(usedtmpref.offset,dir);
  3631. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3632. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3633. list.concat(setoppostfix(taicpu.op_reg_reg(A_ORR,reg,tmpreg),PF_S));
  3634. inc(usedtmpref.offset,dir);
  3635. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3636. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,24));
  3637. list.concat(setoppostfix(taicpu.op_reg_reg(A_ORR,reg,tmpreg),PF_S));
  3638. end;
  3639. end
  3640. else
  3641. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3642. end;
  3643. end
  3644. else
  3645. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3646. if (fromsize=OS_S8) and (tosize = OS_16) then
  3647. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  3648. end;
  3649. procedure tthumbcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3650. var
  3651. l : tasmlabel;
  3652. hr : treference;
  3653. begin
  3654. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3655. internalerror(2002090908);
  3656. if is_thumb_imm(a) then
  3657. list.concat(setoppostfix(taicpu.op_reg_const(A_MOV,reg,a),PF_S))
  3658. else
  3659. begin
  3660. reference_reset(hr,4,[]);
  3661. current_asmdata.getjumplabel(l);
  3662. cg.a_label(current_procinfo.aktlocaldata,l);
  3663. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3664. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3665. hr.symbol:=l;
  3666. hr.base:=NR_PC;
  3667. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3668. end;
  3669. end;
  3670. procedure tthumbcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  3671. var
  3672. hsym : tsym;
  3673. href,
  3674. tmpref : treference;
  3675. paraloc : Pcgparalocation;
  3676. l : TAsmLabel;
  3677. begin
  3678. { calculate the parameter info for the procdef }
  3679. procdef.init_paraloc_info(callerside);
  3680. hsym:=tsym(procdef.parast.Find('self'));
  3681. if not(assigned(hsym) and
  3682. (hsym.typ=paravarsym)) then
  3683. internalerror(2003052504);
  3684. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  3685. while paraloc<>nil do
  3686. with paraloc^ do
  3687. begin
  3688. case loc of
  3689. LOC_REGISTER:
  3690. begin
  3691. if is_thumb_imm(ioffset) then
  3692. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  3693. else
  3694. begin
  3695. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3696. reference_reset(tmpref,4,[]);
  3697. current_asmdata.getjumplabel(l);
  3698. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3699. cg.a_label(current_procinfo.aktlocaldata,l);
  3700. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3701. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3702. tmpref.symbol:=l;
  3703. tmpref.base:=NR_PC;
  3704. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3705. a_op_reg_reg(list,OP_SUB,size,NR_R4,register);
  3706. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3707. end;
  3708. end;
  3709. LOC_REFERENCE:
  3710. begin
  3711. { offset in the wrapper needs to be adjusted for the stored
  3712. return address }
  3713. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),ctempposinvalid,sizeof(pint),[]);
  3714. if is_thumb_imm(ioffset) then
  3715. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  3716. else
  3717. begin
  3718. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3719. reference_reset(tmpref,4,[]);
  3720. current_asmdata.getjumplabel(l);
  3721. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3722. cg.a_label(current_procinfo.aktlocaldata,l);
  3723. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3724. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3725. tmpref.symbol:=l;
  3726. tmpref.base:=NR_PC;
  3727. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3728. a_op_reg_ref(list,OP_SUB,size,NR_R4,href);
  3729. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3730. end;
  3731. end
  3732. else
  3733. internalerror(2003091804);
  3734. end;
  3735. paraloc:=next;
  3736. end;
  3737. end;
  3738. function tthumbcgarm.handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference;
  3739. var
  3740. href : treference;
  3741. tmpreg : TRegister;
  3742. begin
  3743. href:=ref;
  3744. if { LDR/STR limitations }
  3745. (
  3746. (((op=A_LDR) and (oppostfix=PF_None)) or
  3747. ((op=A_STR) and (oppostfix=PF_None))) and
  3748. (ref.base<>NR_STACK_POINTER_REG) and
  3749. (abs(ref.offset)>124)
  3750. ) or
  3751. { LDRB/STRB limitations }
  3752. (
  3753. (((op=A_LDR) and (oppostfix=PF_B)) or
  3754. ((op=A_LDRB) and (oppostfix=PF_None)) or
  3755. ((op=A_STR) and (oppostfix=PF_B)) or
  3756. ((op=A_STRB) and (oppostfix=PF_None))) and
  3757. ((ref.base=NR_STACK_POINTER_REG) or
  3758. (ref.index=NR_STACK_POINTER_REG) or
  3759. (abs(ref.offset)>31)
  3760. )
  3761. ) or
  3762. { LDRH/STRH limitations }
  3763. (
  3764. (((op=A_LDR) and (oppostfix=PF_H)) or
  3765. ((op=A_LDRH) and (oppostfix=PF_None)) or
  3766. ((op=A_STR) and (oppostfix=PF_H)) or
  3767. ((op=A_STRH) and (oppostfix=PF_None))) and
  3768. ((ref.base=NR_STACK_POINTER_REG) or
  3769. (ref.index=NR_STACK_POINTER_REG) or
  3770. (abs(ref.offset)>62) or
  3771. ((abs(ref.offset) mod 2)<>0)
  3772. )
  3773. ) then
  3774. begin
  3775. tmpreg:=getintregister(list,OS_ADDR);
  3776. a_loadaddr_ref_reg(list,ref,tmpreg);
  3777. reference_reset_base(href,tmpreg,0,ref.temppos,ref.alignment,ref.volatility);
  3778. end
  3779. else if (op=A_LDR) and
  3780. (oppostfix in [PF_None]) and
  3781. (ref.base=NR_STACK_POINTER_REG) and
  3782. (abs(ref.offset)>1020) then
  3783. begin
  3784. tmpreg:=getintregister(list,OS_ADDR);
  3785. a_loadaddr_ref_reg(list,ref,tmpreg);
  3786. reference_reset_base(href,tmpreg,0,ref.temppos,ref.alignment,ref.volatility);
  3787. end
  3788. else if (op=A_LDR) and
  3789. ((oppostfix in [PF_SH,PF_SB]) or
  3790. (abs(ref.offset)>124)) then
  3791. begin
  3792. tmpreg:=getintregister(list,OS_ADDR);
  3793. a_loadaddr_ref_reg(list,ref,tmpreg);
  3794. reference_reset_base(href,tmpreg,0,ref.temppos,ref.alignment,ref.volatility);
  3795. end;
  3796. Result:=inherited handle_load_store(list, op, oppostfix, reg, href);
  3797. end;
  3798. procedure tthumbcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  3799. var
  3800. tmpreg : tregister;
  3801. begin
  3802. case op of
  3803. OP_NEG:
  3804. list.concat(taicpu.op_reg_reg(A_NEG,dst,src));
  3805. OP_NOT:
  3806. list.concat(setoppostfix(taicpu.op_reg_reg(A_MVN,dst,src),PF_S));
  3807. OP_DIV,OP_IDIV:
  3808. internalerror(200308284);
  3809. OP_ROL:
  3810. begin
  3811. if not(size in [OS_32,OS_S32]) then
  3812. internalerror(2008072805);
  3813. { simulate ROL by ror'ing 32-value }
  3814. tmpreg:=getintregister(list,OS_32);
  3815. a_load_const_reg(list,OS_32,32,tmpreg);
  3816. list.concat(taicpu.op_reg_reg(A_SUB,tmpreg,src));
  3817. list.concat(setoppostfix(taicpu.op_reg_reg(A_ROR,dst,src),PF_S));
  3818. end;
  3819. else
  3820. begin
  3821. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3822. list.concat(setoppostfix(
  3823. taicpu.op_reg_reg(op_reg_opcg2asmop[op],dst,src),op_reg_postfix_thumb[op]));
  3824. end;
  3825. end;
  3826. maybeadjustresult(list,op,size,dst);
  3827. end;
  3828. procedure tthumbcgarm.a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);
  3829. var
  3830. tmpreg : tregister;
  3831. {$ifdef DUMMY}
  3832. l1 : longint;
  3833. {$endif DUMMY}
  3834. begin
  3835. //!!! ovloc.loc:=LOC_VOID;
  3836. if {$ifopt R+}(a<>-2147483648) and{$endif} {!!!!!! not setflags and } is_thumb_imm(-a) then
  3837. case op of
  3838. OP_ADD:
  3839. begin
  3840. op:=OP_SUB;
  3841. a:=aint(dword(-a));
  3842. end;
  3843. OP_SUB:
  3844. begin
  3845. op:=OP_ADD;
  3846. a:=aint(dword(-a));
  3847. end
  3848. else
  3849. ;
  3850. end;
  3851. if is_thumb_imm(a) and (op in [OP_ADD,OP_SUB]) then
  3852. begin
  3853. // if cgsetflags or setflags then
  3854. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3855. list.concat(setoppostfix(
  3856. taicpu.op_reg_const(op_reg_opcg2asmop[op],dst,a),op_reg_postfix_thumb[op]));
  3857. if (cgsetflags {!!! or setflags }) and (size in [OS_8,OS_16,OS_32]) then
  3858. begin
  3859. //!!! ovloc.loc:=LOC_FLAGS;
  3860. case op of
  3861. OP_ADD:
  3862. //!!! ovloc.resflags:=F_CS;
  3863. ;
  3864. OP_SUB:
  3865. //!!! ovloc.resflags:=F_CC;
  3866. ;
  3867. else
  3868. ;
  3869. end;
  3870. end;
  3871. end
  3872. else
  3873. begin
  3874. { there could be added some more sophisticated optimizations }
  3875. if (op in [OP_MUL,OP_IMUL,OP_DIV,OP_IDIV]) and (a=1) then
  3876. a_load_reg_reg(list,size,size,dst,dst)
  3877. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  3878. a_load_const_reg(list,size,0,dst)
  3879. else if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  3880. a_op_reg_reg(list,OP_NEG,size,dst,dst)
  3881. { we do this here instead in the peephole optimizer because
  3882. it saves us a register }
  3883. {$ifdef DUMMY}
  3884. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  3885. a_op_const_reg_reg(list,OP_SHL,size,l1,dst,dst)
  3886. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  3887. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  3888. begin
  3889. if l1>32 then{roozbeh does this ever happen?}
  3890. internalerror(2003082903);
  3891. shifterop_reset(so);
  3892. so.shiftmode:=SM_LSL;
  3893. so.shiftimm:=l1;
  3894. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,dst,so));
  3895. end
  3896. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  3897. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  3898. begin
  3899. if l1>32 then{does this ever happen?}
  3900. internalerror(2012051802);
  3901. shifterop_reset(so);
  3902. so.shiftmode:=SM_LSL;
  3903. so.shiftimm:=l1;
  3904. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,dst,dst,so));
  3905. end
  3906. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,dst,dst) then
  3907. begin
  3908. { nothing to do on success }
  3909. end
  3910. {$endif DUMMY}
  3911. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  3912. Just using mov x, #0 might allow some easier optimizations down the line. }
  3913. else if (op = OP_AND) and (dword(a)=0) then
  3914. list.concat(setoppostfix(taicpu.op_reg_const(A_MOV,dst,0),PF_S))
  3915. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  3916. else if (op = OP_AND) and (not(dword(a))=0) then
  3917. // do nothing
  3918. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  3919. broader range of shifterconstants.}
  3920. {$ifdef DUMMY}
  3921. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  3922. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,not(dword(a))))
  3923. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  3924. begin
  3925. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm1));
  3926. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  3927. end
  3928. else if (op in [OP_ADD, OP_SUB, OP_OR]) and
  3929. not(cgsetflags or setflags) and
  3930. split_into_shifter_const(a, imm1, imm2) then
  3931. begin
  3932. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm1));
  3933. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  3934. end
  3935. {$endif DUMMY}
  3936. else if (op in [OP_SHL, OP_SHR, OP_SAR]) then
  3937. begin
  3938. list.concat(taicpu.op_reg_reg_const(op_reg_opcg2asmop[op],dst,dst,a));
  3939. end
  3940. else
  3941. begin
  3942. tmpreg:=getintregister(list,size);
  3943. a_load_const_reg(list,size,a,tmpreg);
  3944. a_op_reg_reg(list,op,size,tmpreg,dst);
  3945. end;
  3946. end;
  3947. maybeadjustresult(list,op,size,dst);
  3948. end;
  3949. procedure tthumbcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister);
  3950. begin
  3951. if (op=OP_ADD) and (src=NR_R13) and (dst<>NR_R13) and ((a mod 4)=0) and (a>0) and (a<=1020) then
  3952. list.concat(taicpu.op_reg_reg_const(A_ADD,dst,src,a))
  3953. else
  3954. inherited a_op_const_reg_reg(list,op,size,a,src,dst);
  3955. end;
  3956. procedure tthumbcgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  3957. var
  3958. l1,l2 : tasmlabel;
  3959. ai : taicpu;
  3960. begin
  3961. current_asmdata.getjumplabel(l1);
  3962. current_asmdata.getjumplabel(l2);
  3963. ai:=setcondition(taicpu.op_sym(A_B,l1),flags_to_cond(f));
  3964. ai.is_jmp:=true;
  3965. list.concat(ai);
  3966. list.concat(setoppostfix(taicpu.op_reg_const(A_MOV,reg,0),PF_S));
  3967. list.concat(taicpu.op_sym(A_B,l2));
  3968. cg.a_label(list,l1);
  3969. list.concat(setoppostfix(taicpu.op_reg_const(A_MOV,reg,1),PF_S));
  3970. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3971. cg.a_label(list,l2);
  3972. end;
  3973. procedure tthumb2cgarm.init_register_allocators;
  3974. begin
  3975. inherited init_register_allocators;
  3976. { currently, we save R14 always, so we can use it }
  3977. if (target_info.system<>system_arm_ios) then
  3978. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3979. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3980. RS_R9,RS_R10,RS_R12,RS_R14],first_int_imreg,[])
  3981. else
  3982. { r9 is not available on Darwin according to the llvm code generator }
  3983. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3984. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3985. RS_R10,RS_R12,RS_R14],first_int_imreg,[]);
  3986. if FPUARM_HAS_FPA in fpu_capabilities[current_settings.fputype] then
  3987. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  3988. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  3989. init_mmregister_allocator;
  3990. end;
  3991. procedure tthumb2cgarm.done_register_allocators;
  3992. begin
  3993. rg[R_INTREGISTER].free;
  3994. rg[R_FPUREGISTER].free;
  3995. rg[R_MMREGISTER].free;
  3996. inherited done_register_allocators;
  3997. end;
  3998. procedure tthumb2cgarm.a_call_reg(list : TAsmList;reg: tregister);
  3999. begin
  4000. list.concat(taicpu.op_reg(A_BLX, reg));
  4001. {
  4002. the compiler does not properly set this flag anymore in pass 1, and
  4003. for now we only need it after pass 2 (I hope) (JM)
  4004. if not(pi_do_call in current_procinfo.flags) then
  4005. internalerror(2003060703);
  4006. }
  4007. include(current_procinfo.flags,pi_do_call);
  4008. end;
  4009. procedure tthumb2cgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  4010. var
  4011. l : tasmlabel;
  4012. hr : treference;
  4013. begin
  4014. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  4015. internalerror(2002090909);
  4016. if is_thumb32_imm(a) then
  4017. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  4018. else if is_thumb32_imm(not(a)) then
  4019. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  4020. else if (a and $FFFF)=a then
  4021. list.concat(taicpu.op_reg_const(A_MOVW,reg,a))
  4022. else
  4023. begin
  4024. reference_reset(hr,4,[]);
  4025. current_asmdata.getjumplabel(l);
  4026. cg.a_label(current_procinfo.aktlocaldata,l);
  4027. hr.symboldata:=current_procinfo.aktlocaldata.last;
  4028. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  4029. hr.symbol:=l;
  4030. hr.base:=NR_PC;
  4031. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  4032. end;
  4033. end;
  4034. procedure tthumb2cgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  4035. var
  4036. oppostfix:toppostfix;
  4037. usedtmpref: treference;
  4038. tmpreg,tmpreg2 : tregister;
  4039. so : tshifterop;
  4040. dir : integer;
  4041. begin
  4042. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  4043. FromSize := ToSize;
  4044. case FromSize of
  4045. { signed integer registers }
  4046. OS_8:
  4047. oppostfix:=PF_B;
  4048. OS_S8:
  4049. oppostfix:=PF_SB;
  4050. OS_16:
  4051. oppostfix:=PF_H;
  4052. OS_S16:
  4053. oppostfix:=PF_SH;
  4054. OS_32,
  4055. OS_S32:
  4056. oppostfix:=PF_None;
  4057. else
  4058. InternalError(2003082913);
  4059. end;
  4060. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  4061. begin
  4062. if target_info.endian=endian_big then
  4063. dir:=-1
  4064. else
  4065. dir:=1;
  4066. case FromSize of
  4067. OS_16,OS_S16:
  4068. begin
  4069. { only complicated references need an extra loadaddr }
  4070. if assigned(ref.symbol) or
  4071. (ref.index<>NR_NO) or
  4072. (ref.offset<-255) or
  4073. (ref.offset>4094) or
  4074. { sometimes the compiler reused registers }
  4075. (reg=ref.index) or
  4076. (reg=ref.base) then
  4077. begin
  4078. tmpreg2:=getintregister(list,OS_INT);
  4079. a_loadaddr_ref_reg(list,ref,tmpreg2);
  4080. reference_reset_base(usedtmpref,tmpreg2,0,ref.temppos,ref.alignment,ref.volatility);
  4081. end
  4082. else
  4083. usedtmpref:=ref;
  4084. if target_info.endian=endian_big then
  4085. inc(usedtmpref.offset,1);
  4086. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  4087. tmpreg:=getintregister(list,OS_INT);
  4088. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  4089. inc(usedtmpref.offset,dir);
  4090. if FromSize=OS_16 then
  4091. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  4092. else
  4093. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  4094. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4095. end;
  4096. OS_32,OS_S32:
  4097. begin
  4098. tmpreg:=getintregister(list,OS_INT);
  4099. { only complicated references need an extra loadaddr }
  4100. if assigned(ref.symbol) or
  4101. (ref.index<>NR_NO) or
  4102. (ref.offset<-255) or
  4103. (ref.offset>4092) or
  4104. { sometimes the compiler reused registers }
  4105. (reg=ref.index) or
  4106. (reg=ref.base) then
  4107. begin
  4108. tmpreg2:=getintregister(list,OS_INT);
  4109. a_loadaddr_ref_reg(list,ref,tmpreg2);
  4110. reference_reset_base(usedtmpref,tmpreg2,0,ref.temppos,ref.alignment,ref.volatility);
  4111. end
  4112. else
  4113. usedtmpref:=ref;
  4114. shifterop_reset(so);so.shiftmode:=SM_LSL;
  4115. if ref.alignment=2 then
  4116. begin
  4117. if target_info.endian=endian_big then
  4118. inc(usedtmpref.offset,2);
  4119. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  4120. inc(usedtmpref.offset,dir*2);
  4121. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  4122. so.shiftimm:=16;
  4123. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4124. end
  4125. else
  4126. begin
  4127. if target_info.endian=endian_big then
  4128. inc(usedtmpref.offset,3);
  4129. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  4130. inc(usedtmpref.offset,dir);
  4131. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4132. so.shiftimm:=8;
  4133. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4134. inc(usedtmpref.offset,dir);
  4135. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4136. so.shiftimm:=16;
  4137. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4138. inc(usedtmpref.offset,dir);
  4139. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4140. so.shiftimm:=24;
  4141. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4142. end;
  4143. end
  4144. else
  4145. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4146. end;
  4147. end
  4148. else
  4149. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4150. if (fromsize=OS_S8) and (tosize = OS_16) then
  4151. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  4152. end;
  4153. procedure tthumb2cgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  4154. begin
  4155. if op = OP_NOT then
  4156. begin
  4157. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  4158. case size of
  4159. OS_8: list.concat(taicpu.op_reg_reg(A_UXTB,dst,dst));
  4160. OS_S8: list.concat(taicpu.op_reg_reg(A_SXTB,dst,dst));
  4161. OS_16: list.concat(taicpu.op_reg_reg(A_UXTH,dst,dst));
  4162. OS_S16: list.concat(taicpu.op_reg_reg(A_SXTH,dst,dst));
  4163. OS_32,
  4164. OS_S32:
  4165. ;
  4166. else
  4167. internalerror(2019050916);
  4168. end;
  4169. end
  4170. else
  4171. inherited a_op_reg_reg(list, op, size, src, dst);
  4172. end;
  4173. procedure tthumb2cgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4174. var
  4175. shift, width : byte;
  4176. tmpreg : tregister;
  4177. so : tshifterop;
  4178. l1 : longint;
  4179. begin
  4180. ovloc.loc:=LOC_VOID;
  4181. if (a<>-2147483648) and is_shifter_const(-a,shift) then
  4182. case op of
  4183. OP_ADD:
  4184. begin
  4185. op:=OP_SUB;
  4186. a:=aint(dword(-a));
  4187. end;
  4188. OP_SUB:
  4189. begin
  4190. op:=OP_ADD;
  4191. a:=aint(dword(-a));
  4192. end
  4193. else
  4194. ;
  4195. end;
  4196. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  4197. case op of
  4198. OP_NEG,OP_NOT,
  4199. OP_DIV,OP_IDIV:
  4200. internalerror(200308285);
  4201. OP_SHL:
  4202. begin
  4203. if a>32 then
  4204. internalerror(2014020703);
  4205. if a<>0 then
  4206. begin
  4207. shifterop_reset(so);
  4208. so.shiftmode:=SM_LSL;
  4209. so.shiftimm:=a;
  4210. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4211. end
  4212. else
  4213. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4214. end;
  4215. OP_ROL:
  4216. begin
  4217. if a>32 then
  4218. internalerror(2014020704);
  4219. if a<>0 then
  4220. begin
  4221. shifterop_reset(so);
  4222. so.shiftmode:=SM_ROR;
  4223. so.shiftimm:=32-a;
  4224. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4225. end
  4226. else
  4227. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4228. end;
  4229. OP_ROR:
  4230. begin
  4231. if a>32 then
  4232. internalerror(2014020705);
  4233. if a<>0 then
  4234. begin
  4235. shifterop_reset(so);
  4236. so.shiftmode:=SM_ROR;
  4237. so.shiftimm:=a;
  4238. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4239. end
  4240. else
  4241. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4242. end;
  4243. OP_SHR:
  4244. begin
  4245. if a>32 then
  4246. internalerror(200308292);
  4247. shifterop_reset(so);
  4248. if a<>0 then
  4249. begin
  4250. so.shiftmode:=SM_LSR;
  4251. so.shiftimm:=a;
  4252. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4253. end
  4254. else
  4255. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4256. end;
  4257. OP_SAR:
  4258. begin
  4259. if a>32 then
  4260. internalerror(200308295);
  4261. if a<>0 then
  4262. begin
  4263. shifterop_reset(so);
  4264. so.shiftmode:=SM_ASR;
  4265. so.shiftimm:=a;
  4266. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4267. end
  4268. else
  4269. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4270. end;
  4271. else
  4272. if (op in [OP_SUB, OP_ADD]) and
  4273. ((a < 0) or
  4274. (a > 4095)) then
  4275. begin
  4276. tmpreg:=getintregister(list,size);
  4277. a_load_const_reg(list, size, a, tmpreg);
  4278. if cgsetflags or setflags then
  4279. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4280. list.concat(setoppostfix(
  4281. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4282. end
  4283. else
  4284. begin
  4285. if cgsetflags or setflags then
  4286. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4287. list.concat(setoppostfix(
  4288. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4289. end;
  4290. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  4291. begin
  4292. ovloc.loc:=LOC_FLAGS;
  4293. case op of
  4294. OP_ADD:
  4295. ovloc.resflags:=F_CS;
  4296. OP_SUB:
  4297. ovloc.resflags:=F_CC;
  4298. else
  4299. ;
  4300. end;
  4301. end;
  4302. end
  4303. else
  4304. begin
  4305. { there could be added some more sophisticated optimizations }
  4306. if (op in [OP_MUL,OP_IMUL]) and (a=1) then
  4307. a_load_reg_reg(list,size,size,src,dst)
  4308. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  4309. a_load_const_reg(list,size,0,dst)
  4310. else if (op in [OP_IMUL]) and (a=-1) then
  4311. a_op_reg_reg(list,OP_NEG,size,src,dst)
  4312. { we do this here instead in the peephole optimizer because
  4313. it saves us a register }
  4314. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  4315. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  4316. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  4317. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  4318. begin
  4319. if l1>32 then{roozbeh does this ever happen?}
  4320. internalerror(2003082911);
  4321. shifterop_reset(so);
  4322. so.shiftmode:=SM_LSL;
  4323. so.shiftimm:=l1;
  4324. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  4325. end
  4326. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  4327. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  4328. begin
  4329. if l1>32 then{does this ever happen?}
  4330. internalerror(2012051803);
  4331. shifterop_reset(so);
  4332. so.shiftmode:=SM_LSL;
  4333. so.shiftimm:=l1;
  4334. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  4335. end
  4336. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  4337. begin
  4338. { nothing to do on success }
  4339. end
  4340. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  4341. Just using mov x, #0 might allow some easier optimizations down the line. }
  4342. else if (op = OP_AND) and (dword(a)=0) then
  4343. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  4344. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  4345. else if (op = OP_AND) and (not(dword(a))=0) then
  4346. list.concat(taicpu.op_reg_reg(A_MOV,dst,src))
  4347. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  4348. broader range of shifterconstants.}
  4349. {else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  4350. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))}
  4351. else if (op = OP_AND) and is_thumb32_imm(a) then
  4352. list.concat(taicpu.op_reg_reg_const(A_AND,dst,src,dword(a)))
  4353. else if (op = OP_AND) and (a = $FFFF) then
  4354. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  4355. else if (op = OP_AND) and is_thumb32_imm(not(dword(a))) then
  4356. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  4357. else if (op = OP_AND) and is_continuous_mask(aword(not(a)), shift, width) then
  4358. begin
  4359. a_load_reg_reg(list,size,size,src,dst);
  4360. list.concat(taicpu.op_reg_const_const(A_BFC,dst,shift,width))
  4361. end
  4362. else
  4363. begin
  4364. tmpreg:=getintregister(list,size);
  4365. a_load_const_reg(list,size,a,tmpreg);
  4366. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  4367. end;
  4368. end;
  4369. maybeadjustresult(list,op,size,dst);
  4370. end;
  4371. const
  4372. op_reg_reg_opcg2asmopThumb2: array[TOpCG] of tasmop =
  4373. (A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NONE,A_MVN,A_ORR,
  4374. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  4375. procedure tthumb2cgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4376. var
  4377. so : tshifterop;
  4378. tmpreg,overflowreg : tregister;
  4379. asmop : tasmop;
  4380. begin
  4381. ovloc.loc:=LOC_VOID;
  4382. case op of
  4383. OP_NEG,OP_NOT:
  4384. internalerror(200308286);
  4385. OP_ROL:
  4386. begin
  4387. if not(size in [OS_32,OS_S32]) then
  4388. internalerror(2008072806);
  4389. { simulate ROL by ror'ing 32-value }
  4390. tmpreg:=getintregister(list,OS_32);
  4391. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,32));
  4392. list.concat(taicpu.op_reg_reg_reg(A_SUB,src1,tmpreg,src1));
  4393. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4394. end;
  4395. OP_ROR:
  4396. begin
  4397. if not(size in [OS_32,OS_S32]) then
  4398. internalerror(2008072802);
  4399. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4400. end;
  4401. OP_IMUL,
  4402. OP_MUL:
  4403. begin
  4404. if cgsetflags or setflags then
  4405. begin
  4406. overflowreg:=getintregister(list,size);
  4407. if op=OP_IMUL then
  4408. asmop:=A_SMULL
  4409. else
  4410. asmop:=A_UMULL;
  4411. { the arm doesn't allow that rd and rm are the same }
  4412. if dst=src2 then
  4413. begin
  4414. if dst<>src1 then
  4415. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  4416. else
  4417. begin
  4418. tmpreg:=getintregister(list,size);
  4419. a_load_reg_reg(list,size,size,src2,dst);
  4420. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  4421. end;
  4422. end
  4423. else
  4424. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  4425. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4426. if op=OP_IMUL then
  4427. begin
  4428. shifterop_reset(so);
  4429. so.shiftmode:=SM_ASR;
  4430. so.shiftimm:=31;
  4431. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  4432. end
  4433. else
  4434. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  4435. ovloc.loc:=LOC_FLAGS;
  4436. ovloc.resflags:=F_NE;
  4437. end
  4438. else
  4439. begin
  4440. { the arm doesn't allow that rd and rm are the same }
  4441. if dst=src2 then
  4442. begin
  4443. if dst<>src1 then
  4444. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  4445. else
  4446. begin
  4447. tmpreg:=getintregister(list,size);
  4448. a_load_reg_reg(list,size,size,src2,dst);
  4449. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  4450. end;
  4451. end
  4452. else
  4453. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  4454. end;
  4455. end;
  4456. else
  4457. begin
  4458. if cgsetflags or setflags then
  4459. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4460. {$ifdef dummy}
  4461. { R13 is not allowed for certain instruction operands }
  4462. if op_reg_reg_opcg2asmopThumb2[op] in [A_ADD,A_SUB,A_AND,A_BIC,A_EOR] then
  4463. begin
  4464. if getsupreg(dst)=RS_R13 then
  4465. begin
  4466. tmpreg:=getintregister(list,OS_INT);
  4467. a_load_reg_reg(list,OS_INT,OS_INT,dst,tmpreg);
  4468. dst:=tmpreg;
  4469. end;
  4470. if getsupreg(src1)=RS_R13 then
  4471. begin
  4472. tmpreg:=getintregister(list,OS_INT);
  4473. a_load_reg_reg(list,OS_INT,OS_INT,src1,tmpreg);
  4474. src1:=tmpreg;
  4475. end;
  4476. end;
  4477. {$endif}
  4478. list.concat(setoppostfix(
  4479. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmopThumb2[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4480. end;
  4481. end;
  4482. maybeadjustresult(list,op,size,dst);
  4483. end;
  4484. procedure tthumb2cgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  4485. begin
  4486. list.concat(taicpu.op_cond(A_ITE, flags_to_cond(f)));
  4487. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  4488. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  4489. end;
  4490. procedure tthumb2cgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  4491. var
  4492. ref : treference;
  4493. shift : byte;
  4494. firstfloatreg,lastfloatreg,
  4495. r : byte;
  4496. regs : tcpuregisterset;
  4497. stackmisalignment: pint;
  4498. begin
  4499. LocalSize:=align(LocalSize,4);
  4500. { call instruction does not put anything on the stack }
  4501. stackmisalignment:=0;
  4502. if not(nostackframe) then
  4503. begin
  4504. firstfloatreg:=RS_NO;
  4505. lastfloatreg:=RS_NO;
  4506. if FPUARM_HAS_FPA in fpu_capabilities[current_settings.fputype] then
  4507. begin
  4508. { save floating point registers? }
  4509. for r:=RS_F0 to RS_F7 do
  4510. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4511. begin
  4512. if firstfloatreg=RS_NO then
  4513. firstfloatreg:=r;
  4514. lastfloatreg:=r;
  4515. inc(stackmisalignment,12);
  4516. end;
  4517. end;
  4518. a_reg_alloc(list,NR_STACK_POINTER_REG);
  4519. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4520. begin
  4521. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  4522. a_reg_alloc(list,NR_R12);
  4523. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  4524. end;
  4525. { save int registers }
  4526. reference_reset(ref,4,[]);
  4527. ref.index:=NR_STACK_POINTER_REG;
  4528. ref.addressmode:=AM_PREINDEXED;
  4529. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4530. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4531. regs:=regs+[RS_FRAME_POINTER_REG,RS_R14]
  4532. else if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  4533. include(regs,RS_R14);
  4534. if regs<>[] then
  4535. begin
  4536. for r:=RS_R0 to RS_R15 do
  4537. if (r in regs) then
  4538. inc(stackmisalignment,4);
  4539. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4540. end;
  4541. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4542. begin
  4543. { the framepointer now points to the saved R15, so the saved
  4544. framepointer is at R11-12 (for get_caller_frame) }
  4545. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  4546. a_reg_dealloc(list,NR_R12);
  4547. end;
  4548. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4549. if (LocalSize<>0) or
  4550. ((stackmisalignment<>0) and
  4551. ((pi_do_call in current_procinfo.flags) or
  4552. (po_assembler in current_procinfo.procdef.procoptions))) then
  4553. begin
  4554. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4555. if not(is_shifter_const(localsize,shift)) then
  4556. begin
  4557. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  4558. a_reg_alloc(list,NR_R12);
  4559. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4560. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  4561. a_reg_dealloc(list,NR_R12);
  4562. end
  4563. else
  4564. begin
  4565. a_reg_dealloc(list,NR_R12);
  4566. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  4567. end;
  4568. end;
  4569. if FPUARM_HAS_FPA in fpu_capabilities[current_settings.fputype] then
  4570. begin
  4571. if firstfloatreg<>RS_NO then
  4572. begin
  4573. reference_reset(ref,4,[]);
  4574. if tg.direction*tcpuprocinfo(current_procinfo).floatregstart>=1023 then
  4575. begin
  4576. a_load_const_reg(list,OS_ADDR,-tcpuprocinfo(current_procinfo).floatregstart,NR_R12);
  4577. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4578. ref.base:=NR_R12;
  4579. end
  4580. else
  4581. begin
  4582. ref.base:=current_procinfo.framepointer;
  4583. ref.offset:=tcpuprocinfo(current_procinfo).floatregstart;
  4584. end;
  4585. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4586. lastfloatreg-firstfloatreg+1,ref));
  4587. end;
  4588. end;
  4589. end;
  4590. end;
  4591. procedure tthumb2cgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  4592. var
  4593. ref : treference;
  4594. firstfloatreg,lastfloatreg,
  4595. r : byte;
  4596. shift : byte;
  4597. regs : tcpuregisterset;
  4598. LocalSize : longint;
  4599. stackmisalignment: pint;
  4600. begin
  4601. if not(nostackframe) then
  4602. begin
  4603. stackmisalignment:=0;
  4604. if FPUARM_HAS_FPA in fpu_capabilities[current_settings.fputype] then
  4605. begin
  4606. { restore floating point register }
  4607. firstfloatreg:=RS_NO;
  4608. lastfloatreg:=RS_NO;
  4609. { save floating point registers? }
  4610. for r:=RS_F0 to RS_F7 do
  4611. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4612. begin
  4613. if firstfloatreg=RS_NO then
  4614. firstfloatreg:=r;
  4615. lastfloatreg:=r;
  4616. { floating point register space is already included in
  4617. localsize below by calc_stackframe_size
  4618. inc(stackmisalignment,12);
  4619. }
  4620. end;
  4621. if firstfloatreg<>RS_NO then
  4622. begin
  4623. reference_reset(ref,4,[]);
  4624. if tg.direction*tcpuprocinfo(current_procinfo).floatregstart>=1023 then
  4625. begin
  4626. a_load_const_reg(list,OS_ADDR,-tcpuprocinfo(current_procinfo).floatregstart,NR_R12);
  4627. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4628. ref.base:=NR_R12;
  4629. end
  4630. else
  4631. begin
  4632. ref.base:=current_procinfo.framepointer;
  4633. ref.offset:=tcpuprocinfo(current_procinfo).floatregstart;
  4634. end;
  4635. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4636. lastfloatreg-firstfloatreg+1,ref));
  4637. end;
  4638. end;
  4639. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4640. if (pi_do_call in current_procinfo.flags) or (regs<>[]) then
  4641. begin
  4642. exclude(regs,RS_R14);
  4643. include(regs,RS_R15);
  4644. end;
  4645. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  4646. regs:=regs+[RS_FRAME_POINTER_REG,RS_R15];
  4647. for r:=RS_R0 to RS_R15 do
  4648. if (r in regs) then
  4649. inc(stackmisalignment,4);
  4650. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4651. LocalSize:=current_procinfo.calc_stackframe_size;
  4652. if (LocalSize<>0) or
  4653. ((stackmisalignment<>0) and
  4654. ((pi_do_call in current_procinfo.flags) or
  4655. (po_assembler in current_procinfo.procdef.procoptions))) then
  4656. begin
  4657. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4658. if not(is_shifter_const(LocalSize,shift)) then
  4659. begin
  4660. a_reg_alloc(list,NR_R12);
  4661. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4662. list.concat(taicpu.op_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_R12));
  4663. a_reg_dealloc(list,NR_R12);
  4664. end
  4665. else
  4666. begin
  4667. a_reg_dealloc(list,NR_R12);
  4668. list.concat(taicpu.op_reg_const(A_ADD,NR_STACK_POINTER_REG,LocalSize));
  4669. end;
  4670. end;
  4671. if regs=[] then
  4672. list.concat(taicpu.op_reg(A_BX,NR_R14))
  4673. else
  4674. begin
  4675. reference_reset(ref,4,[]);
  4676. ref.index:=NR_STACK_POINTER_REG;
  4677. ref.addressmode:=AM_PREINDEXED;
  4678. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4679. end;
  4680. end
  4681. else
  4682. list.concat(taicpu.op_reg(A_BX,NR_R14));
  4683. end;
  4684. function tthumb2cgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  4685. var
  4686. tmpreg : tregister;
  4687. tmpref : treference;
  4688. l : tasmlabel;
  4689. begin
  4690. tmpreg:=NR_NO;
  4691. { Be sure to have a base register }
  4692. if (ref.base=NR_NO) then
  4693. begin
  4694. if ref.shiftmode<>SM_None then
  4695. internalerror(2014020706);
  4696. ref.base:=ref.index;
  4697. ref.index:=NR_NO;
  4698. end;
  4699. { absolute symbols can't be handled directly, we've to store the symbol reference
  4700. in the text segment and access it pc relative
  4701. For now, we assume that references where base or index equals to PC are already
  4702. relative, all other references are assumed to be absolute and thus they need
  4703. to be handled extra.
  4704. A proper solution would be to change refoptions to a set and store the information
  4705. if the symbol is absolute or relative there.
  4706. }
  4707. if (assigned(ref.symbol) and
  4708. not(is_pc(ref.base)) and
  4709. not(is_pc(ref.index))
  4710. ) or
  4711. { [#xxx] isn't a valid address operand }
  4712. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  4713. //(ref.offset<-4095) or
  4714. (ref.offset<-255) or
  4715. (ref.offset>4095) or
  4716. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  4717. ((ref.offset<-255) or
  4718. (ref.offset>255)
  4719. )
  4720. ) or
  4721. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  4722. ((ref.offset<-1020) or
  4723. (ref.offset>1020) or
  4724. ((abs(ref.offset) mod 4)<>0) or
  4725. { the usual pc relative symbol handling assumes possible offsets of +/- 4095 }
  4726. assigned(ref.symbol)
  4727. )
  4728. ) then
  4729. begin
  4730. reference_reset(tmpref,4,[]);
  4731. { load symbol }
  4732. tmpreg:=getintregister(list,OS_INT);
  4733. if assigned(ref.symbol) then
  4734. begin
  4735. current_asmdata.getjumplabel(l);
  4736. cg.a_label(current_procinfo.aktlocaldata,l);
  4737. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  4738. if ref.refaddr=addr_gottpoff then
  4739. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_gottpoff,ref.symbol,ref.relsymbol,ref.offset))
  4740. else if ref.refaddr=addr_tlsgd then
  4741. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_tlsgd,ref.symbol,ref.relsymbol,ref.offset))
  4742. else if ref.refaddr=addr_tlsdesc then
  4743. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_tlsdesc,ref.symbol,ref.relsymbol,ref.offset))
  4744. else if ref.refaddr=addr_tpoff then
  4745. begin
  4746. if assigned(ref.relsymbol) or (ref.offset<>0) then
  4747. Internalerror(2019092807);
  4748. current_procinfo.aktlocaldata.concat(tai_const.Create_type_sym(aitconst_tpoff,ref.symbol));
  4749. end
  4750. else
  4751. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset));
  4752. { load consts entry }
  4753. tmpref.symbol:=l;
  4754. tmpref.base:=NR_R15;
  4755. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  4756. { in case of LDF/STF, we got rid of the NR_R15 }
  4757. if is_pc(ref.base) then
  4758. ref.base:=NR_NO;
  4759. if is_pc(ref.index) then
  4760. ref.index:=NR_NO;
  4761. end
  4762. else
  4763. a_load_const_reg(list,OS_ADDR,ref.offset,tmpreg);
  4764. if (ref.base<>NR_NO) then
  4765. begin
  4766. if ref.index<>NR_NO then
  4767. begin
  4768. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4769. ref.base:=tmpreg;
  4770. end
  4771. else
  4772. begin
  4773. ref.index:=tmpreg;
  4774. ref.shiftimm:=0;
  4775. ref.signindex:=1;
  4776. ref.shiftmode:=SM_None;
  4777. end;
  4778. end
  4779. else
  4780. ref.base:=tmpreg;
  4781. ref.offset:=0;
  4782. ref.symbol:=nil;
  4783. end;
  4784. if (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  4785. begin
  4786. if tmpreg<>NR_NO then
  4787. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg,tmpreg)
  4788. else
  4789. begin
  4790. tmpreg:=getintregister(list,OS_ADDR);
  4791. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg);
  4792. ref.base:=tmpreg;
  4793. end;
  4794. ref.offset:=0;
  4795. end;
  4796. { Hack? Thumb2 doesn't allow PC indexed addressing modes(although it does in the specification) }
  4797. if (ref.base=NR_R15) and (ref.index<>NR_NO) and (ref.shiftmode <> sm_none) then
  4798. begin
  4799. tmpreg:=getintregister(list,OS_ADDR);
  4800. list.concat(taicpu.op_reg_reg(A_MOV, tmpreg, NR_R15));
  4801. ref.base := tmpreg;
  4802. end;
  4803. { floating point operations have only limited references
  4804. we expect here, that a base is already set }
  4805. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  4806. begin
  4807. if ref.shiftmode<>SM_none then
  4808. internalerror(2003091202);
  4809. if tmpreg<>NR_NO then
  4810. begin
  4811. if ref.base=tmpreg then
  4812. begin
  4813. if ref.signindex<0 then
  4814. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,tmpreg,ref.index))
  4815. else
  4816. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,tmpreg,ref.index));
  4817. ref.index:=NR_NO;
  4818. end
  4819. else
  4820. begin
  4821. if ref.index<>tmpreg then
  4822. internalerror(2004031602);
  4823. if ref.signindex<0 then
  4824. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,ref.base,tmpreg))
  4825. else
  4826. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4827. ref.base:=tmpreg;
  4828. ref.index:=NR_NO;
  4829. end;
  4830. end
  4831. else
  4832. begin
  4833. tmpreg:=getintregister(list,OS_ADDR);
  4834. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,ref.index));
  4835. ref.base:=tmpreg;
  4836. ref.index:=NR_NO;
  4837. end;
  4838. end;
  4839. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  4840. Result := ref;
  4841. end;
  4842. procedure tthumb2cgarm.a_loadmm_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister; shuffle: pmmshuffle);
  4843. var
  4844. instr: taicpu;
  4845. begin
  4846. if (fromsize=OS_F32) and
  4847. (tosize=OS_F32) then
  4848. begin
  4849. instr:=setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32);
  4850. list.Concat(instr);
  4851. add_move_instruction(instr);
  4852. { VMOV cannot generate an FPU exception, so we do not need a check here }
  4853. end
  4854. else if (fromsize=OS_F64) and
  4855. (tosize=OS_F64) then
  4856. begin
  4857. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,tregister(longint(reg2)+1),tregister(longint(reg1)+1)), PF_F32));
  4858. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32));
  4859. end
  4860. else if (fromsize=OS_F32) and
  4861. (tosize=OS_F64) then
  4862. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VCVT,reg2,reg1), PF_F32))
  4863. begin
  4864. //list.concat(nil);
  4865. end;
  4866. end;
  4867. procedure tthumb2cgarm.a_loadmm_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  4868. begin
  4869. handle_load_store(list,A_VLDR,PF_None,reg,ref);
  4870. end;
  4871. procedure tthumb2cgarm.a_loadmm_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  4872. begin
  4873. handle_load_store(list,A_VSTR,PF_None,reg,ref);
  4874. { VSTR cannot generate an FPU exception, so we do not need a check here }
  4875. end;
  4876. procedure tthumb2cgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize: tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  4877. begin
  4878. if //(shuffle=nil) and
  4879. (tosize=OS_F32) then
  4880. list.Concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg))
  4881. else
  4882. internalerror(2012100813);
  4883. end;
  4884. procedure tthumb2cgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize: tcgsize; mmreg, intreg: tregister; shuffle: pmmshuffle);
  4885. begin
  4886. if //(shuffle=nil) and
  4887. (fromsize=OS_F32) then
  4888. begin
  4889. list.Concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg));
  4890. { VMOV cannot generate an FPU exception, so we do not need a check here }
  4891. end
  4892. else
  4893. internalerror(2012100814);
  4894. end;
  4895. procedure tthumb2cg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  4896. var tmpreg: tregister;
  4897. begin
  4898. case op of
  4899. OP_NEG:
  4900. begin
  4901. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4902. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  4903. tmpreg:=cg.getintregister(list,OS_32);
  4904. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,0));
  4905. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,tmpreg,regsrc.reghi));
  4906. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4907. end;
  4908. else
  4909. inherited a_op64_reg_reg(list, op, size, regsrc, regdst);
  4910. end;
  4911. end;
  4912. procedure tthumbcg64farm.a_op64_reg_reg(list: TAsmList; op: TOpCG; size: tcgsize; regsrc, regdst: tregister64);
  4913. begin
  4914. case op of
  4915. OP_NEG:
  4916. begin
  4917. list.concat(setoppostfix(taicpu.op_reg_const(A_MOV,regdst.reglo,0),PF_S));
  4918. list.concat(setoppostfix(taicpu.op_reg_const(A_MOV,regdst.reghi,0),PF_S));
  4919. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4920. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4921. list.concat(setoppostfix(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi),PF_S));
  4922. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4923. end;
  4924. OP_NOT:
  4925. begin
  4926. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  4927. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  4928. end;
  4929. OP_AND,OP_OR,OP_XOR:
  4930. begin
  4931. cg.a_op_reg_reg(list,op,OS_32,regsrc.reglo,regdst.reglo);
  4932. cg.a_op_reg_reg(list,op,OS_32,regsrc.reghi,regdst.reghi);
  4933. end;
  4934. OP_ADD:
  4935. begin
  4936. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4937. list.concat(taicpu.op_reg_reg(A_ADD,regdst.reglo,regsrc.reglo));
  4938. list.concat(setoppostfix(taicpu.op_reg_reg(A_ADC,regdst.reghi,regsrc.reghi),PF_S));
  4939. end;
  4940. OP_SUB:
  4941. begin
  4942. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4943. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4944. list.concat(setoppostfix(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi),PF_S));
  4945. end;
  4946. else
  4947. internalerror(2003083105);
  4948. end;
  4949. end;
  4950. procedure tthumbcg64farm.a_op64_const_reg(list: TAsmList; op: TOpCG; size: tcgsize; value: int64; reg: tregister64);
  4951. var
  4952. tmpreg : tregister;
  4953. begin
  4954. case op of
  4955. OP_AND,OP_OR,OP_XOR:
  4956. begin
  4957. cg.a_op_const_reg(list,op,OS_32,aint(lo(value)),reg.reglo);
  4958. cg.a_op_const_reg(list,op,OS_32,aint(hi(value)),reg.reghi);
  4959. end;
  4960. OP_ADD:
  4961. begin
  4962. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4963. begin
  4964. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4965. list.concat(taicpu.op_reg_const(A_ADD,reg.reglo,aint(lo(value))));
  4966. end
  4967. else
  4968. begin
  4969. tmpreg:=cg.getintregister(list,OS_32);
  4970. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4971. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4972. list.concat(taicpu.op_reg_reg(A_ADD,reg.reglo,tmpreg));
  4973. end;
  4974. tmpreg:=cg.getintregister(list,OS_32);
  4975. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  4976. list.concat(setoppostfix(taicpu.op_reg_reg(A_ADC,reg.reghi,tmpreg),PF_S));
  4977. end;
  4978. OP_SUB:
  4979. begin
  4980. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4981. begin
  4982. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4983. list.concat(taicpu.op_reg_const(A_SUB,reg.reglo,aint(lo(value))))
  4984. end
  4985. else
  4986. begin
  4987. tmpreg:=cg.getintregister(list,OS_32);
  4988. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4989. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4990. list.concat(taicpu.op_reg_reg(A_SUB,reg.reglo,tmpreg));
  4991. end;
  4992. tmpreg:=cg.getintregister(list,OS_32);
  4993. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  4994. list.concat(setoppostfix(taicpu.op_reg_reg(A_SBC,reg.reghi,tmpreg),PF_S));
  4995. end;
  4996. else
  4997. internalerror(2003083106);
  4998. end;
  4999. end;
  5000. procedure create_codegen;
  5001. begin
  5002. if GenerateThumb2Code then
  5003. begin
  5004. cg:=tthumb2cgarm.create;
  5005. cg64:=tthumb2cg64farm.create;
  5006. casmoptimizer:=TCpuThumb2AsmOptimizer;
  5007. end
  5008. else if GenerateThumbCode then
  5009. begin
  5010. cg:=tthumbcgarm.create;
  5011. cg64:=tthumbcg64farm.create;
  5012. // casmoptimizer:=TCpuThumbAsmOptimizer;
  5013. end
  5014. else
  5015. begin
  5016. cg:=tarmcgarm.create;
  5017. cg64:=tarmcg64farm.create;
  5018. casmoptimizer:=TCpuAsmOptimizer;
  5019. end;
  5020. end;
  5021. end.