cgcpu.pas 213 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152215321542155215621572158215921602161216221632164216521662167216821692170217121722173217421752176217721782179218021812182218321842185218621872188218921902191219221932194219521962197219821992200220122022203220422052206220722082209221022112212221322142215221622172218221922202221222222232224222522262227222822292230223122322233223422352236223722382239224022412242224322442245224622472248224922502251225222532254225522562257225822592260226122622263226422652266226722682269227022712272227322742275227622772278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277727782779278027812782278327842785278627872788278927902791279227932794279527962797279827992800280128022803280428052806280728082809281028112812281328142815281628172818281928202821282228232824282528262827282828292830283128322833283428352836283728382839284028412842284328442845284628472848284928502851285228532854285528562857285828592860286128622863286428652866286728682869287028712872287328742875287628772878287928802881288228832884288528862887288828892890289128922893289428952896289728982899290029012902290329042905290629072908290929102911291229132914291529162917291829192920292129222923292429252926292729282929293029312932293329342935293629372938293929402941294229432944294529462947294829492950295129522953295429552956295729582959296029612962296329642965296629672968296929702971297229732974297529762977297829792980298129822983298429852986298729882989299029912992299329942995299629972998299930003001300230033004300530063007300830093010301130123013301430153016301730183019302030213022302330243025302630273028302930303031303230333034303530363037303830393040304130423043304430453046304730483049305030513052305330543055305630573058305930603061306230633064306530663067306830693070307130723073307430753076307730783079308030813082308330843085308630873088308930903091309230933094309530963097309830993100310131023103310431053106310731083109311031113112311331143115311631173118311931203121312231233124312531263127312831293130313131323133313431353136313731383139314031413142314331443145314631473148314931503151315231533154315531563157315831593160316131623163316431653166316731683169317031713172317331743175317631773178317931803181318231833184318531863187318831893190319131923193319431953196319731983199320032013202320332043205320632073208320932103211321232133214321532163217321832193220322132223223322432253226322732283229323032313232323332343235323632373238323932403241324232433244324532463247324832493250325132523253325432553256325732583259326032613262326332643265326632673268326932703271327232733274327532763277327832793280328132823283328432853286328732883289329032913292329332943295329632973298329933003301330233033304330533063307330833093310331133123313331433153316331733183319332033213322332333243325332633273328332933303331333233333334333533363337333833393340334133423343334433453346334733483349335033513352335333543355335633573358335933603361336233633364336533663367336833693370337133723373337433753376337733783379338033813382338333843385338633873388338933903391339233933394339533963397339833993400340134023403340434053406340734083409341034113412341334143415341634173418341934203421342234233424342534263427342834293430343134323433343434353436343734383439344034413442344334443445344634473448344934503451345234533454345534563457345834593460346134623463346434653466346734683469347034713472347334743475347634773478347934803481348234833484348534863487348834893490349134923493349434953496349734983499350035013502350335043505350635073508350935103511351235133514351535163517351835193520352135223523352435253526352735283529353035313532353335343535353635373538353935403541354235433544354535463547354835493550355135523553355435553556355735583559356035613562356335643565356635673568356935703571357235733574357535763577357835793580358135823583358435853586358735883589359035913592359335943595359635973598359936003601360236033604360536063607360836093610361136123613361436153616361736183619362036213622362336243625362636273628362936303631363236333634363536363637363836393640364136423643364436453646364736483649365036513652365336543655365636573658365936603661366236633664366536663667366836693670367136723673367436753676367736783679368036813682368336843685368636873688368936903691369236933694369536963697369836993700370137023703370437053706370737083709371037113712371337143715371637173718371937203721372237233724372537263727372837293730373137323733373437353736373737383739374037413742374337443745374637473748374937503751375237533754375537563757375837593760376137623763376437653766376737683769377037713772377337743775377637773778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427742784279428042814282428342844285428642874288428942904291429242934294429542964297429842994300430143024303430443054306430743084309431043114312431343144315431643174318431943204321432243234324432543264327432843294330433143324333433443354336433743384339434043414342434343444345434643474348434943504351435243534354435543564357435843594360436143624363436443654366436743684369437043714372437343744375437643774378437943804381438243834384438543864387438843894390439143924393439443954396439743984399440044014402440344044405440644074408440944104411441244134414441544164417441844194420442144224423442444254426442744284429443044314432443344344435443644374438443944404441444244434444444544464447444844494450445144524453445444554456445744584459446044614462446344644465446644674468446944704471447244734474447544764477447844794480448144824483448444854486448744884489449044914492449344944495449644974498449945004501450245034504450545064507450845094510451145124513451445154516451745184519452045214522452345244525452645274528452945304531453245334534453545364537453845394540454145424543454445454546454745484549455045514552455345544555455645574558455945604561456245634564456545664567456845694570457145724573457445754576457745784579458045814582458345844585458645874588458945904591459245934594459545964597459845994600460146024603460446054606460746084609461046114612461346144615461646174618461946204621462246234624462546264627462846294630463146324633463446354636463746384639464046414642464346444645464646474648464946504651465246534654465546564657465846594660466146624663466446654666466746684669467046714672467346744675467646774678467946804681468246834684468546864687468846894690469146924693469446954696469746984699470047014702470347044705470647074708470947104711471247134714471547164717471847194720472147224723472447254726472747284729473047314732473347344735473647374738473947404741474247434744474547464747474847494750475147524753475447554756475747584759476047614762476347644765476647674768476947704771477247734774477547764777477847794780478147824783478447854786478747884789479047914792479347944795479647974798479948004801480248034804480548064807480848094810481148124813481448154816481748184819482048214822482348244825482648274828482948304831483248334834483548364837483848394840484148424843484448454846484748484849485048514852485348544855485648574858485948604861486248634864486548664867486848694870487148724873487448754876487748784879488048814882488348844885488648874888488948904891489248934894489548964897489848994900490149024903490449054906490749084909491049114912491349144915491649174918491949204921492249234924492549264927492849294930493149324933493449354936493749384939494049414942494349444945494649474948494949504951495249534954495549564957495849594960496149624963496449654966496749684969497049714972497349744975497649774978497949804981498249834984498549864987498849894990499149924993499449954996499749984999500050015002500350045005500650075008500950105011501250135014501550165017501850195020502150225023502450255026502750285029503050315032503350345035503650375038503950405041504250435044504550465047504850495050505150525053505450555056505750585059506050615062506350645065506650675068506950705071507250735074507550765077507850795080508150825083508450855086508750885089509050915092509350945095509650975098509951005101510251035104510551065107510851095110511151125113511451155116511751185119512051215122512351245125512651275128512951305131513251335134513551365137513851395140514151425143514451455146514751485149515051515152515351545155515651575158515951605161516251635164516551665167516851695170517151725173517451755176517751785179518051815182518351845185518651875188518951905191519251935194519551965197519851995200520152025203520452055206520752085209521052115212521352145215521652175218521952205221522252235224522552265227522852295230523152325233523452355236523752385239524052415242524352445245524652475248524952505251525252535254525552565257525852595260526152625263526452655266526752685269527052715272527352745275527652775278527952805281528252835284528552865287528852895290529152925293529452955296529752985299530053015302530353045305530653075308530953105311531253135314531553165317531853195320532153225323532453255326
  1. {
  2. Copyright (c) 2003 by Florian Klaempfl
  3. Member of the Free Pascal development team
  4. This unit implements the code generator for the ARM
  5. This program is free software; you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation; either version 2 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program; if not, write to the Free Software
  15. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  16. ****************************************************************************
  17. }
  18. unit cgcpu;
  19. {$i fpcdefs.inc}
  20. interface
  21. uses
  22. globtype,symtype,symdef,
  23. cgbase,cgutils,cgobj,
  24. aasmbase,aasmcpu,aasmtai,aasmdata,
  25. parabase,
  26. cpubase,cpuinfo,cg64f32,rgcpu;
  27. type
  28. { tbasecgarm is shared between all arm architectures }
  29. tbasecgarm = class(tcg)
  30. { true, if the next arithmetic operation should modify the flags }
  31. cgsetflags : boolean;
  32. procedure a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);override;
  33. procedure a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);override;
  34. procedure a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);override;
  35. procedure a_call_name(list : TAsmList;const s : string; weak: boolean);override;
  36. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  37. { move instructions }
  38. procedure a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);override;
  39. procedure a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);override;
  40. function a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  41. function a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  42. { fpu move instructions }
  43. procedure a_loadfpu_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister); override;
  44. procedure a_loadfpu_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister); override;
  45. procedure a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference); override;
  46. procedure a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);override;
  47. { comparison operations }
  48. procedure a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  49. l : tasmlabel);override;
  50. procedure a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel); override;
  51. procedure a_jmp_name(list : TAsmList;const s : string); override;
  52. procedure a_jmp_always(list : TAsmList;l: tasmlabel); override;
  53. procedure a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel); override;
  54. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  55. procedure g_profilecode(list : TAsmList); override;
  56. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  57. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  58. procedure g_maybe_got_init(list : TAsmList); override;
  59. procedure a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);override;
  60. procedure g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);override;
  61. procedure g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);override;
  62. procedure g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  63. procedure g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  64. procedure g_overflowcheck(list: TAsmList; const l: tlocation; def: tdef); override;
  65. procedure g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);override;
  66. procedure g_save_registers(list : TAsmList);override;
  67. procedure g_restore_registers(list : TAsmList);override;
  68. procedure a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  69. procedure fixref(list : TAsmList;var ref : treference);
  70. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; virtual;
  71. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  72. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  73. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  74. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  75. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  76. procedure a_opmm_reg_reg(list: TAsmList; Op: TOpCG; size : tcgsize;src,dst: tregister;shuffle : pmmshuffle); override;
  77. { Transform unsupported methods into Internal errors }
  78. procedure a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister); override;
  79. { try to generate optimized 32 Bit multiplication, returns true if successful generated }
  80. function try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  81. { clear out potential overflow bits from 8 or 16 bit operations }
  82. { the upper 24/16 bits of a register after an operation }
  83. procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  84. { mla for thumb requires that none of the registers is equal to r13/r15, this method ensures this }
  85. procedure safe_mla(list: TAsmList;op1,op2,op3,op4 : TRegister);
  86. end;
  87. { tcgarm is shared between normal arm and thumb-2 }
  88. tcgarm = class(tbasecgarm)
  89. procedure a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister); override;
  90. procedure a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference); override;
  91. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  92. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  93. size: tcgsize; a: tcgint; src, dst: tregister); override;
  94. procedure a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  95. size: tcgsize; src1, src2, dst: tregister); override;
  96. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  97. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  98. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  99. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  100. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  101. {Multiply two 32-bit registers into lo and hi 32-bit registers}
  102. procedure a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister); override;
  103. end;
  104. { normal arm cg }
  105. tarmcgarm = class(tcgarm)
  106. procedure init_register_allocators;override;
  107. procedure done_register_allocators;override;
  108. end;
  109. { 64 bit cg for all arm flavours }
  110. tbasecg64farm = class(tcg64f32)
  111. end;
  112. { tcg64farm is shared between normal arm and thumb-2 }
  113. tcg64farm = class(tbasecg64farm)
  114. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  115. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  116. procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;
  117. procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
  118. procedure a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  119. procedure a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  120. procedure a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);override;
  121. procedure a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);override;
  122. end;
  123. tarmcg64farm = class(tcg64farm)
  124. end;
  125. tthumbcgarm = class(tbasecgarm)
  126. procedure init_register_allocators;override;
  127. procedure done_register_allocators;override;
  128. procedure g_proc_entry(list: TAsmList; localsize: longint; nostackframe: boolean);override;
  129. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  130. procedure a_op_reg_reg(list: TAsmList; Op: TOpCG; size: TCGSize; src,dst: TRegister);override;
  131. procedure a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);override;
  132. procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister); override;
  133. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  134. procedure a_load_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const Ref: treference; reg: tregister);override;
  135. procedure a_load_const_reg(list: TAsmList; size: tcgsize; a: tcgint; reg: tregister);override;
  136. procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint); override;
  137. function handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference; override;
  138. end;
  139. tthumbcg64farm = class(tbasecg64farm)
  140. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  141. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  142. end;
  143. tthumb2cgarm = class(tcgarm)
  144. procedure init_register_allocators;override;
  145. procedure done_register_allocators;override;
  146. procedure a_call_reg(list : TAsmList;reg: tregister);override;
  147. procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);override;
  148. procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;
  149. procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;
  150. procedure a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  151. procedure a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);override;
  152. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;
  153. procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;
  154. procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;
  155. function handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference; override;
  156. procedure a_loadmm_reg_reg(list: TAsmList; fromsize, tosize : tcgsize;reg1, reg2: tregister;shuffle : pmmshuffle); override;
  157. procedure a_loadmm_ref_reg(list: TAsmList; fromsize, tosize : tcgsize;const ref: treference; reg: tregister;shuffle : pmmshuffle); override;
  158. procedure a_loadmm_reg_ref(list: TAsmList; fromsize, tosize : tcgsize;reg: tregister; const ref: treference;shuffle : pmmshuffle); override;
  159. procedure a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize;intreg, mmreg: tregister; shuffle: pmmshuffle); override;
  160. procedure a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize;mmreg, intreg: tregister; shuffle : pmmshuffle); override;
  161. end;
  162. tthumb2cg64farm = class(tcg64farm)
  163. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  164. end;
  165. const
  166. OpCmp2AsmCond : Array[topcmp] of TAsmCond = (C_NONE,C_EQ,C_GT,
  167. C_LT,C_GE,C_LE,C_NE,C_LS,C_CC,C_CS,C_HI);
  168. winstackpagesize = 4096;
  169. function get_fpu_postfix(def : tdef) : toppostfix;
  170. procedure create_codegen;
  171. implementation
  172. uses
  173. globals,verbose,systems,cutils,
  174. aopt,aoptcpu,
  175. fmodule,
  176. symconst,symsym,symtable,
  177. tgobj,
  178. procinfo,cpupi,
  179. paramgr;
  180. function get_fpu_postfix(def : tdef) : toppostfix;
  181. begin
  182. if def.typ=floatdef then
  183. begin
  184. case tfloatdef(def).floattype of
  185. s32real:
  186. result:=PF_S;
  187. s64real:
  188. result:=PF_D;
  189. s80real:
  190. result:=PF_E;
  191. else
  192. internalerror(200401272);
  193. end;
  194. end
  195. else
  196. internalerror(200401271);
  197. end;
  198. procedure tarmcgarm.init_register_allocators;
  199. begin
  200. inherited init_register_allocators;
  201. { currently, we always save R14, so we can use it }
  202. if (target_info.system<>system_arm_darwin) then
  203. begin
  204. if assigned(current_procinfo) and (current_procinfo.framepointer<>NR_R11) then
  205. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  206. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  207. RS_R9,RS_R10,RS_R11,RS_R14],first_int_imreg,[])
  208. else
  209. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  210. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R12,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  211. RS_R9,RS_R10,RS_R14],first_int_imreg,[])
  212. end
  213. else
  214. { r7 is not available on Darwin, it's used as frame pointer (always,
  215. for backtrace support -- also in gcc/clang -> R11 can be used).
  216. r9 is volatile }
  217. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  218. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R9,RS_R12,RS_R4,RS_R5,RS_R6,RS_R8,
  219. RS_R10,RS_R11,RS_R14],first_int_imreg,[]);
  220. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  221. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  222. { The register allocator currently cannot deal with multiple
  223. non-overlapping subregs per register, so we can only use
  224. half the single precision registers for now (as sub registers of the
  225. double precision ones). }
  226. if current_settings.fputype=fpu_vfpv3 then
  227. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  228. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  229. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  230. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  231. ],first_mm_imreg,[])
  232. else
  233. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  234. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15],first_mm_imreg,[]);
  235. end;
  236. procedure tarmcgarm.done_register_allocators;
  237. begin
  238. rg[R_INTREGISTER].free;
  239. rg[R_FPUREGISTER].free;
  240. rg[R_MMREGISTER].free;
  241. inherited done_register_allocators;
  242. end;
  243. procedure tcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  244. var
  245. imm_shift : byte;
  246. l : tasmlabel;
  247. hr : treference;
  248. imm1, imm2: DWord;
  249. begin
  250. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  251. internalerror(2002090902);
  252. if is_shifter_const(a,imm_shift) then
  253. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  254. else if is_shifter_const(not(a),imm_shift) then
  255. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  256. { loading of constants with mov and orr }
  257. else if (split_into_shifter_const(a,imm1, imm2)) then
  258. begin
  259. list.concat(taicpu.op_reg_const(A_MOV,reg, imm1));
  260. list.concat(taicpu.op_reg_reg_const(A_ORR,reg,reg, imm2));
  261. end
  262. { loading of constants with mvn and bic }
  263. else if (split_into_shifter_const(not(a), imm1, imm2)) then
  264. begin
  265. list.concat(taicpu.op_reg_const(A_MVN,reg, imm1));
  266. list.concat(taicpu.op_reg_reg_const(A_BIC,reg,reg, imm2));
  267. end
  268. else
  269. begin
  270. reference_reset(hr,4);
  271. current_asmdata.getjumplabel(l);
  272. cg.a_label(current_procinfo.aktlocaldata,l);
  273. hr.symboldata:=current_procinfo.aktlocaldata.last;
  274. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  275. hr.symbol:=l;
  276. hr.base:=NR_PC;
  277. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  278. end;
  279. end;
  280. procedure tcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  281. var
  282. oppostfix:toppostfix;
  283. usedtmpref: treference;
  284. tmpreg,tmpreg2 : tregister;
  285. so : tshifterop;
  286. dir : integer;
  287. begin
  288. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  289. FromSize := ToSize;
  290. case FromSize of
  291. { signed integer registers }
  292. OS_8:
  293. oppostfix:=PF_B;
  294. OS_S8:
  295. oppostfix:=PF_SB;
  296. OS_16:
  297. oppostfix:=PF_H;
  298. OS_S16:
  299. oppostfix:=PF_SH;
  300. OS_32,
  301. OS_S32:
  302. oppostfix:=PF_None;
  303. else
  304. InternalError(200308297);
  305. end;
  306. if (fromsize=OS_S8) and
  307. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  308. oppostfix:=PF_B;
  309. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize])) or
  310. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  311. (oppostfix in [PF_SH,PF_H])) then
  312. begin
  313. if target_info.endian=endian_big then
  314. dir:=-1
  315. else
  316. dir:=1;
  317. case FromSize of
  318. OS_16,OS_S16:
  319. begin
  320. { only complicated references need an extra loadaddr }
  321. if assigned(ref.symbol) or
  322. (ref.index<>NR_NO) or
  323. (ref.offset<-4095) or
  324. (ref.offset>4094) or
  325. { sometimes the compiler reused registers }
  326. (reg=ref.index) or
  327. (reg=ref.base) then
  328. begin
  329. tmpreg2:=getintregister(list,OS_INT);
  330. a_loadaddr_ref_reg(list,ref,tmpreg2);
  331. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  332. end
  333. else
  334. usedtmpref:=ref;
  335. if target_info.endian=endian_big then
  336. inc(usedtmpref.offset,1);
  337. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  338. tmpreg:=getintregister(list,OS_INT);
  339. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  340. inc(usedtmpref.offset,dir);
  341. if FromSize=OS_16 then
  342. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  343. else
  344. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  345. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  346. end;
  347. OS_32,OS_S32:
  348. begin
  349. tmpreg:=getintregister(list,OS_INT);
  350. { only complicated references need an extra loadaddr }
  351. if assigned(ref.symbol) or
  352. (ref.index<>NR_NO) or
  353. (ref.offset<-4095) or
  354. (ref.offset>4092) or
  355. { sometimes the compiler reused registers }
  356. (reg=ref.index) or
  357. (reg=ref.base) then
  358. begin
  359. tmpreg2:=getintregister(list,OS_INT);
  360. a_loadaddr_ref_reg(list,ref,tmpreg2);
  361. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  362. end
  363. else
  364. usedtmpref:=ref;
  365. shifterop_reset(so);so.shiftmode:=SM_LSL;
  366. if ref.alignment=2 then
  367. begin
  368. if target_info.endian=endian_big then
  369. inc(usedtmpref.offset,2);
  370. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  371. inc(usedtmpref.offset,dir*2);
  372. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  373. so.shiftimm:=16;
  374. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  375. end
  376. else
  377. begin
  378. tmpreg2:=getintregister(list,OS_INT);
  379. if target_info.endian=endian_big then
  380. inc(usedtmpref.offset,3);
  381. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  382. inc(usedtmpref.offset,dir);
  383. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  384. inc(usedtmpref.offset,dir);
  385. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg2);
  386. so.shiftimm:=8;
  387. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  388. inc(usedtmpref.offset,dir);
  389. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  390. so.shiftimm:=16;
  391. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg2,so));
  392. so.shiftimm:=24;
  393. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  394. end;
  395. end
  396. else
  397. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  398. end;
  399. end
  400. else
  401. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  402. if (fromsize=OS_S8) and
  403. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  404. a_load_reg_reg(list,OS_S8,OS_32,reg,reg)
  405. else if (fromsize=OS_S8) and (tosize = OS_16) then
  406. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  407. end;
  408. procedure tcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  409. var
  410. hsym : tsym;
  411. href : treference;
  412. paraloc : Pcgparalocation;
  413. shift : byte;
  414. begin
  415. { calculate the parameter info for the procdef }
  416. procdef.init_paraloc_info(callerside);
  417. hsym:=tsym(procdef.parast.Find('self'));
  418. if not(assigned(hsym) and
  419. (hsym.typ=paravarsym)) then
  420. internalerror(200305251);
  421. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  422. while paraloc<>nil do
  423. with paraloc^ do
  424. begin
  425. case loc of
  426. LOC_REGISTER:
  427. begin
  428. if is_shifter_const(ioffset,shift) then
  429. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  430. else
  431. begin
  432. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  433. a_op_reg_reg(list,OP_SUB,size,NR_R12,register);
  434. end;
  435. end;
  436. LOC_REFERENCE:
  437. begin
  438. { offset in the wrapper needs to be adjusted for the stored
  439. return address }
  440. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),sizeof(pint));
  441. if is_shifter_const(ioffset,shift) then
  442. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  443. else
  444. begin
  445. a_load_const_reg(list,OS_ADDR,ioffset,NR_R12);
  446. a_op_reg_ref(list,OP_SUB,size,NR_R12,href);
  447. end;
  448. end
  449. else
  450. internalerror(200309189);
  451. end;
  452. paraloc:=next;
  453. end;
  454. end;
  455. procedure tbasecgarm.a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const paraloc : TCGPara);
  456. var
  457. ref: treference;
  458. begin
  459. paraloc.check_simple_location;
  460. paramanager.allocparaloc(list,paraloc.location);
  461. case paraloc.location^.loc of
  462. LOC_REGISTER,LOC_CREGISTER:
  463. a_load_const_reg(list,size,a,paraloc.location^.register);
  464. LOC_REFERENCE:
  465. begin
  466. reference_reset(ref,paraloc.alignment);
  467. ref.base:=paraloc.location^.reference.index;
  468. ref.offset:=paraloc.location^.reference.offset;
  469. a_load_const_ref(list,size,a,ref);
  470. end;
  471. else
  472. internalerror(2002081101);
  473. end;
  474. end;
  475. procedure tbasecgarm.a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const paraloc : TCGPara);
  476. var
  477. tmpref, ref: treference;
  478. location: pcgparalocation;
  479. sizeleft: aint;
  480. begin
  481. location := paraloc.location;
  482. tmpref := r;
  483. sizeleft := paraloc.intsize;
  484. while assigned(location) do
  485. begin
  486. paramanager.allocparaloc(list,location);
  487. case location^.loc of
  488. LOC_REGISTER,LOC_CREGISTER:
  489. a_load_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  490. LOC_REFERENCE:
  491. begin
  492. reference_reset_base(ref,location^.reference.index,location^.reference.offset,paraloc.alignment);
  493. { doubles in softemu mode have a strange order of registers and references }
  494. if location^.size=OS_32 then
  495. g_concatcopy(list,tmpref,ref,4)
  496. else
  497. begin
  498. g_concatcopy(list,tmpref,ref,sizeleft);
  499. if assigned(location^.next) then
  500. internalerror(2005010710);
  501. end;
  502. end;
  503. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  504. case location^.size of
  505. OS_F32, OS_F64:
  506. a_loadfpu_ref_reg(list,location^.size,location^.size,tmpref,location^.register);
  507. else
  508. internalerror(2002072801);
  509. end;
  510. LOC_VOID:
  511. begin
  512. // nothing to do
  513. end;
  514. else
  515. internalerror(2002081103);
  516. end;
  517. inc(tmpref.offset,tcgsize2size[location^.size]);
  518. dec(sizeleft,tcgsize2size[location^.size]);
  519. location := location^.next;
  520. end;
  521. end;
  522. procedure tbasecgarm.a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const paraloc : TCGPara);
  523. var
  524. ref: treference;
  525. tmpreg: tregister;
  526. begin
  527. paraloc.check_simple_location;
  528. paramanager.allocparaloc(list,paraloc.location);
  529. case paraloc.location^.loc of
  530. LOC_REGISTER,LOC_CREGISTER:
  531. a_loadaddr_ref_reg(list,r,paraloc.location^.register);
  532. LOC_REFERENCE:
  533. begin
  534. reference_reset(ref,paraloc.alignment);
  535. ref.base := paraloc.location^.reference.index;
  536. ref.offset := paraloc.location^.reference.offset;
  537. tmpreg := getintregister(list,OS_ADDR);
  538. a_loadaddr_ref_reg(list,r,tmpreg);
  539. a_load_reg_ref(list,OS_ADDR,OS_ADDR,tmpreg,ref);
  540. end;
  541. else
  542. internalerror(2002080701);
  543. end;
  544. end;
  545. procedure tbasecgarm.a_call_name(list : TAsmList;const s : string; weak: boolean);
  546. var
  547. branchopcode: tasmop;
  548. r : treference;
  549. sym : TAsmSymbol;
  550. begin
  551. { check not really correct: should only be used for non-Thumb cpus }
  552. if (CPUARM_HAS_BLX_LABEL in cpu_capabilities[current_settings.cputype]) and
  553. { WinCE GNU AS (not sure if this applies in general) does not support BLX imm }
  554. (target_info.system<>system_arm_wince) then
  555. branchopcode:=A_BLX
  556. else
  557. branchopcode:=A_BL;
  558. if not(weak) then
  559. sym:=current_asmdata.RefAsmSymbol(s)
  560. else
  561. sym:=current_asmdata.WeakRefAsmSymbol(s);
  562. reference_reset_symbol(r,sym,0,sizeof(pint));
  563. if (tf_pic_uses_got in target_info.flags) and
  564. (cs_create_pic in current_settings.moduleswitches) then
  565. begin
  566. r.refaddr:=addr_pic
  567. end
  568. else
  569. r.refaddr:=addr_full;
  570. list.concat(taicpu.op_ref(branchopcode,r));
  571. {
  572. the compiler does not properly set this flag anymore in pass 1, and
  573. for now we only need it after pass 2 (I hope) (JM)
  574. if not(pi_do_call in current_procinfo.flags) then
  575. internalerror(2003060703);
  576. }
  577. include(current_procinfo.flags,pi_do_call);
  578. end;
  579. procedure tbasecgarm.a_call_reg(list : TAsmList;reg: tregister);
  580. begin
  581. { check not really correct: should only be used for non-Thumb cpus }
  582. if not(CPUARM_HAS_BLX in cpu_capabilities[current_settings.cputype]) then
  583. begin
  584. list.concat(taicpu.op_reg_reg(A_MOV,NR_R14,NR_PC));
  585. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,reg));
  586. end
  587. else
  588. list.concat(taicpu.op_reg(A_BLX, reg));
  589. {
  590. the compiler does not properly set this flag anymore in pass 1, and
  591. for now we only need it after pass 2 (I hope) (JM)
  592. if not(pi_do_call in current_procinfo.flags) then
  593. internalerror(2003060703);
  594. }
  595. include(current_procinfo.flags,pi_do_call);
  596. end;
  597. procedure tcgarm.a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister);
  598. begin
  599. a_op_const_reg_reg(list,op,size,a,reg,reg);
  600. end;
  601. procedure tcgarm.a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference);
  602. var
  603. tmpreg,tmpresreg : tregister;
  604. tmpref : treference;
  605. begin
  606. tmpreg:=getintregister(list,size);
  607. tmpresreg:=getintregister(list,size);
  608. tmpref:=a_internal_load_ref_reg(list,size,size,ref,tmpreg);
  609. a_op_const_reg_reg(list,op,size,a,tmpreg,tmpresreg);
  610. a_load_reg_ref(list,size,size,tmpresreg,tmpref);
  611. end;
  612. procedure tcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  613. var
  614. so : tshifterop;
  615. begin
  616. if op = OP_NEG then
  617. begin
  618. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,src,0));
  619. maybeadjustresult(list,OP_NEG,size,dst);
  620. end
  621. else if op = OP_NOT then
  622. begin
  623. if size in [OS_8, OS_16, OS_S8, OS_S16] then
  624. begin
  625. shifterop_reset(so);
  626. so.shiftmode:=SM_LSL;
  627. if size in [OS_8, OS_S8] then
  628. so.shiftimm:=24
  629. else
  630. so.shiftimm:=16;
  631. list.concat(taicpu.op_reg_reg_shifterop(A_MVN,dst,src,so));
  632. {Using a shift here allows this to be folded into another instruction}
  633. if size in [OS_S8, OS_S16] then
  634. so.shiftmode:=SM_ASR
  635. else
  636. so.shiftmode:=SM_LSR;
  637. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  638. end
  639. else
  640. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  641. end
  642. else
  643. a_op_reg_reg_reg(list,op,size,src,dst,dst);
  644. end;
  645. const
  646. op_reg_reg_opcg2asmop: array[TOpCG] of tasmop =
  647. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  648. A_NONE,A_NONE,A_NONE,A_SUB,A_EOR,A_NONE,A_NONE);
  649. op_reg_opcg2asmop: array[TOpCG] of tasmop =
  650. (A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MUL,A_MUL,A_NONE,A_NONE,A_ORR,
  651. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  652. op_reg_postfix: array[TOpCG] of TOpPostfix =
  653. (PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,
  654. PF_None,PF_None,PF_None,PF_None,PF_None,PF_None,PF_None);
  655. procedure tcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg;
  656. size: tcgsize; a: tcgint; src, dst: tregister);
  657. var
  658. ovloc : tlocation;
  659. begin
  660. a_op_const_reg_reg_checkoverflow(list,op,size,a,src,dst,false,ovloc);
  661. end;
  662. procedure tcgarm.a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
  663. size: tcgsize; src1, src2, dst: tregister);
  664. var
  665. ovloc : tlocation;
  666. begin
  667. a_op_reg_reg_reg_checkoverflow(list,op,size,src1,src2,dst,false,ovloc);
  668. end;
  669. function opshift2shiftmode(op: TOpCg): tshiftmode;
  670. begin
  671. case op of
  672. OP_SHL: Result:=SM_LSL;
  673. OP_SHR: Result:=SM_LSR;
  674. OP_ROR: Result:=SM_ROR;
  675. OP_ROL: Result:=SM_ROR;
  676. OP_SAR: Result:=SM_ASR;
  677. else internalerror(2012070501);
  678. end
  679. end;
  680. function tbasecgarm.try_optimized_mul32_const_reg_reg(list: TAsmList; a: tcgint; src, dst: tregister) : boolean;
  681. var
  682. multiplier : dword;
  683. power : longint;
  684. shifterop : tshifterop;
  685. bitsset : byte;
  686. negative : boolean;
  687. first : boolean;
  688. b,
  689. cycles : byte;
  690. maxeffort : byte;
  691. begin
  692. result:=true;
  693. cycles:=0;
  694. negative:=a<0;
  695. shifterop.rs:=NR_NO;
  696. shifterop.shiftmode:=SM_LSL;
  697. if negative then
  698. inc(cycles);
  699. multiplier:=dword(abs(a));
  700. bitsset:=popcnt(multiplier and $fffffffe);
  701. { heuristics to estimate how much instructions are reasonable to replace the mul,
  702. this is currently based on XScale timings }
  703. { in the simplest case, we need a mov to load the constant and a mul to carry out the
  704. actual multiplication, this requires min. 1+4 cycles
  705. because the first shift imm. might cause a stall and because we need more instructions
  706. when replacing the mul we generate max. 3 instructions to replace this mul }
  707. maxeffort:=3;
  708. { if the constant is not a shifter op, we need either some mov/mvn/bic/or sequence or
  709. a ldr, so generating one more operation to replace this is beneficial }
  710. if not(is_shifter_const(dword(a),b)) and not(is_shifter_const(not(dword(a)),b)) then
  711. inc(maxeffort);
  712. { if the upper 5 bits are all set or clear, mul is one cycle faster }
  713. if ((dword(a) and $f8000000)=0) or ((dword(a) and $f8000000)=$f8000000) then
  714. dec(maxeffort);
  715. { if the upper 17 bits are all set or clear, mul is another cycle faster }
  716. if ((dword(a) and $ffff8000)=0) or ((dword(a) and $ffff8000)=$ffff8000) then
  717. dec(maxeffort);
  718. { most simple cases }
  719. if a=1 then
  720. a_load_reg_reg(list,OS_32,OS_32,src,dst)
  721. else if a=0 then
  722. a_load_const_reg(list,OS_32,0,dst)
  723. else if a=-1 then
  724. a_op_reg_reg(list,OP_NEG,OS_32,src,dst)
  725. { add up ?
  726. basically, one add is needed for each bit being set in the constant factor
  727. however, the least significant bit is for free, it can be hidden in the initial
  728. instruction
  729. }
  730. else if (bitsset+cycles<=maxeffort) and
  731. (bitsset<=popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)) then
  732. begin
  733. first:=true;
  734. while multiplier<>0 do
  735. begin
  736. shifterop.shiftimm:=BsrDWord(multiplier);
  737. if odd(multiplier) then
  738. begin
  739. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,shifterop));
  740. dec(multiplier);
  741. end
  742. else
  743. if first then
  744. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  745. else
  746. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,src,shifterop));
  747. first:=false;
  748. dec(multiplier,1 shl shifterop.shiftimm);
  749. end;
  750. if negative then
  751. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  752. end
  753. { subtract from the next greater power of two? }
  754. else if popcnt(dword(nextpowerof2(multiplier,power)-multiplier) and $fffffffe)+cycles+1<=maxeffort then
  755. begin
  756. first:=true;
  757. while multiplier<>0 do
  758. begin
  759. if first then
  760. begin
  761. multiplier:=(1 shl power)-multiplier;
  762. shifterop.shiftimm:=power;
  763. end
  764. else
  765. shifterop.shiftimm:=BsrDWord(multiplier);
  766. if odd(multiplier) then
  767. begin
  768. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,shifterop));
  769. dec(multiplier);
  770. end
  771. else
  772. if first then
  773. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,shifterop))
  774. else
  775. begin
  776. list.concat(taicpu.op_reg_reg_reg_shifterop(A_SUB,dst,dst,src,shifterop));
  777. dec(multiplier,1 shl shifterop.shiftimm);
  778. end;
  779. first:=false;
  780. end;
  781. if negative then
  782. list.concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,0));
  783. end
  784. else
  785. result:=false;
  786. end;
  787. procedure tcgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  788. var
  789. shift, lsb, width : byte;
  790. tmpreg : tregister;
  791. so : tshifterop;
  792. l1 : longint;
  793. imm1, imm2: DWord;
  794. begin
  795. optimize_op_const(size, op, a);
  796. case op of
  797. OP_NONE:
  798. begin
  799. if src <> dst then
  800. a_load_reg_reg(list, size, size, src, dst);
  801. exit;
  802. end;
  803. OP_MOVE:
  804. begin
  805. a_load_const_reg(list, size, a, dst);
  806. exit;
  807. end;
  808. end;
  809. ovloc.loc:=LOC_VOID;
  810. if {$ifopt R+}(a<>-2147483648) and{$endif} not setflags and is_shifter_const(-a,shift) then
  811. case op of
  812. OP_ADD:
  813. begin
  814. op:=OP_SUB;
  815. a:=aint(dword(-a));
  816. end;
  817. OP_SUB:
  818. begin
  819. op:=OP_ADD;
  820. a:=aint(dword(-a));
  821. end
  822. end;
  823. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  824. case op of
  825. OP_NEG,OP_NOT:
  826. internalerror(200308281);
  827. OP_SHL,
  828. OP_SHR,
  829. OP_ROL,
  830. OP_ROR,
  831. OP_SAR:
  832. begin
  833. if a>32 then
  834. internalerror(200308294);
  835. shifterop_reset(so);
  836. so.shiftmode:=opshift2shiftmode(op);
  837. if op = OP_ROL then
  838. so.shiftimm:=32-a
  839. else
  840. so.shiftimm:=a;
  841. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  842. end;
  843. else
  844. {if (op in [OP_SUB, OP_ADD]) and
  845. ((a < 0) or
  846. (a > 4095)) then
  847. begin
  848. tmpreg:=getintregister(list,size);
  849. list.concat(taicpu.op_reg_const(A_MOVT, tmpreg, (a shr 16) and $FFFF));
  850. list.concat(taicpu.op_reg_const(A_MOV, tmpreg, a and $FFFF));
  851. list.concat(setoppostfix(taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))
  852. ));
  853. end
  854. else}
  855. begin
  856. if cgsetflags or setflags then
  857. a_reg_alloc(list,NR_DEFAULTFLAGS);
  858. list.concat(setoppostfix(
  859. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  860. end;
  861. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  862. begin
  863. ovloc.loc:=LOC_FLAGS;
  864. case op of
  865. OP_ADD:
  866. ovloc.resflags:=F_CS;
  867. OP_SUB:
  868. ovloc.resflags:=F_CC;
  869. end;
  870. end;
  871. end
  872. else
  873. begin
  874. { there could be added some more sophisticated optimizations }
  875. if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  876. a_op_reg_reg(list,OP_NEG,size,src,dst)
  877. { we do this here instead in the peephole optimizer because
  878. it saves us a register }
  879. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  880. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  881. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  882. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  883. begin
  884. if l1>32 then{roozbeh does this ever happen?}
  885. internalerror(200308296);
  886. shifterop_reset(so);
  887. so.shiftmode:=SM_LSL;
  888. so.shiftimm:=l1;
  889. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  890. end
  891. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  892. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  893. begin
  894. if l1>32 then{does this ever happen?}
  895. internalerror(201205181);
  896. shifterop_reset(so);
  897. so.shiftmode:=SM_LSL;
  898. so.shiftimm:=l1;
  899. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  900. end
  901. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  902. begin
  903. { nothing to do on success }
  904. end
  905. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  906. broader range of shifterconstants.}
  907. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  908. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  909. { Doing two shifts instead of two bics might allow the peephole optimizer to fold the second shift
  910. into the following instruction}
  911. else if (op = OP_AND) and
  912. is_continuous_mask(a, lsb, width) and
  913. ((lsb = 0) or ((lsb + width) = 32)) then
  914. begin
  915. shifterop_reset(so);
  916. if (width = 16) and
  917. (lsb = 0) and
  918. (current_settings.cputype >= cpu_armv6) then
  919. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  920. else if (width = 8) and
  921. (lsb = 0) and
  922. (current_settings.cputype >= cpu_armv6) then
  923. list.concat(taicpu.op_reg_reg(A_UXTB,dst,src))
  924. else if lsb = 0 then
  925. begin
  926. so.shiftmode:=SM_LSL;
  927. so.shiftimm:=32-width;
  928. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  929. so.shiftmode:=SM_LSR;
  930. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  931. end
  932. else
  933. begin
  934. so.shiftmode:=SM_LSR;
  935. so.shiftimm:=lsb;
  936. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  937. so.shiftmode:=SM_LSL;
  938. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,dst,so));
  939. end;
  940. end
  941. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  942. begin
  943. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,imm1));
  944. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  945. end
  946. else if (op in [OP_ADD, OP_SUB, OP_OR, OP_XOR]) and
  947. not(cgsetflags or setflags) and
  948. split_into_shifter_const(a, imm1, imm2) then
  949. begin
  950. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,imm1));
  951. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  952. end
  953. else
  954. begin
  955. tmpreg:=getintregister(list,size);
  956. a_load_const_reg(list,size,a,tmpreg);
  957. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  958. end;
  959. end;
  960. maybeadjustresult(list,op,size,dst);
  961. end;
  962. procedure tcgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  963. var
  964. so : tshifterop;
  965. tmpreg,overflowreg : tregister;
  966. asmop : tasmop;
  967. begin
  968. ovloc.loc:=LOC_VOID;
  969. case op of
  970. OP_NEG,OP_NOT,
  971. OP_DIV,OP_IDIV:
  972. internalerror(200308283);
  973. OP_SHL,
  974. OP_SHR,
  975. OP_SAR,
  976. OP_ROR:
  977. begin
  978. if (op = OP_ROR) and not(size in [OS_32,OS_S32]) then
  979. internalerror(2008072801);
  980. shifterop_reset(so);
  981. so.rs:=src1;
  982. so.shiftmode:=opshift2shiftmode(op);
  983. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  984. end;
  985. OP_ROL:
  986. begin
  987. if not(size in [OS_32,OS_S32]) then
  988. internalerror(2008072801);
  989. { simulate ROL by ror'ing 32-value }
  990. tmpreg:=getintregister(list,OS_32);
  991. list.concat(taicpu.op_reg_reg_const(A_RSB,tmpreg,src1, 32));
  992. shifterop_reset(so);
  993. so.rs:=tmpreg;
  994. so.shiftmode:=SM_ROR;
  995. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src2,so));
  996. end;
  997. OP_IMUL,
  998. OP_MUL:
  999. begin
  1000. if (cgsetflags or setflags) and
  1001. (CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype]) then
  1002. begin
  1003. overflowreg:=getintregister(list,size);
  1004. if op=OP_IMUL then
  1005. asmop:=A_SMULL
  1006. else
  1007. asmop:=A_UMULL;
  1008. { the arm doesn't allow that rd and rm are the same }
  1009. if dst=src2 then
  1010. begin
  1011. if dst<>src1 then
  1012. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  1013. else
  1014. begin
  1015. tmpreg:=getintregister(list,size);
  1016. a_load_reg_reg(list,size,size,src2,dst);
  1017. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  1018. end;
  1019. end
  1020. else
  1021. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  1022. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1023. if op=OP_IMUL then
  1024. begin
  1025. shifterop_reset(so);
  1026. so.shiftmode:=SM_ASR;
  1027. so.shiftimm:=31;
  1028. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  1029. end
  1030. else
  1031. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  1032. ovloc.loc:=LOC_FLAGS;
  1033. ovloc.resflags:=F_NE;
  1034. end
  1035. else
  1036. begin
  1037. { the arm doesn't allow that rd and rm are the same }
  1038. if dst=src2 then
  1039. begin
  1040. if dst<>src1 then
  1041. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  1042. else
  1043. begin
  1044. tmpreg:=getintregister(list,size);
  1045. a_load_reg_reg(list,size,size,src2,dst);
  1046. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  1047. end;
  1048. end
  1049. else
  1050. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  1051. end;
  1052. end;
  1053. else
  1054. begin
  1055. if cgsetflags or setflags then
  1056. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1057. list.concat(setoppostfix(
  1058. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  1059. end;
  1060. end;
  1061. maybeadjustresult(list,op,size,dst);
  1062. end;
  1063. procedure tcgarm.a_mul_reg_reg_pair(list: tasmlist; size: tcgsize; src1,src2,dstlo,dsthi: tregister);
  1064. var
  1065. asmop: tasmop;
  1066. begin
  1067. if CPUARM_HAS_UMULL in cpu_capabilities[current_settings.cputype] then
  1068. begin
  1069. list.concat(tai_comment.create(strpnew('tcgarm.a_mul_reg_reg_pair called')));
  1070. case size of
  1071. OS_32: asmop:=A_UMULL;
  1072. OS_S32: asmop:=A_SMULL;
  1073. else
  1074. InternalError(2014060802);
  1075. end;
  1076. { The caller might omit dstlo or dsthi, when he is not interested in it, we still
  1077. need valid registers everywhere. In case of dsthi = NR_NO we could fall back to
  1078. 32x32=32 bit multiplication}
  1079. if (dstlo = NR_NO) then
  1080. dstlo:=getintregister(list,size);
  1081. if (dsthi = NR_NO) then
  1082. dsthi:=getintregister(list,size);
  1083. list.concat(taicpu.op_reg_reg_reg_reg(asmop, dstlo, dsthi, src1,src2));
  1084. end
  1085. else if dsthi=NR_NO then
  1086. begin
  1087. if (dstlo = NR_NO) then
  1088. dstlo:=getintregister(list,size);
  1089. list.concat(taicpu.op_reg_reg_reg(A_MUL, dstlo, src1,src2));
  1090. end
  1091. else
  1092. begin
  1093. internalerror(2015083022);
  1094. end;
  1095. end;
  1096. function tbasecgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  1097. var
  1098. tmpreg1,tmpreg2 : tregister;
  1099. tmpref : treference;
  1100. l : tasmlabel;
  1101. begin
  1102. tmpreg1:=NR_NO;
  1103. { Be sure to have a base register }
  1104. if (ref.base=NR_NO) then
  1105. begin
  1106. if ref.shiftmode<>SM_None then
  1107. internalerror(2014020701);
  1108. ref.base:=ref.index;
  1109. ref.index:=NR_NO;
  1110. end;
  1111. { absolute symbols can't be handled directly, we've to store the symbol reference
  1112. in the text segment and access it pc relative
  1113. For now, we assume that references where base or index equals to PC are already
  1114. relative, all other references are assumed to be absolute and thus they need
  1115. to be handled extra.
  1116. A proper solution would be to change refoptions to a set and store the information
  1117. if the symbol is absolute or relative there.
  1118. }
  1119. if (assigned(ref.symbol) and
  1120. not(is_pc(ref.base)) and
  1121. not(is_pc(ref.index))
  1122. ) or
  1123. { [#xxx] isn't a valid address operand }
  1124. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  1125. (ref.offset<-4095) or
  1126. (ref.offset>4095) or
  1127. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  1128. ((ref.offset<-255) or
  1129. (ref.offset>255)
  1130. )
  1131. ) or
  1132. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1133. ((ref.offset<-1020) or
  1134. (ref.offset>1020) or
  1135. ((abs(ref.offset) mod 4)<>0)
  1136. )
  1137. ) or
  1138. ((GenerateThumbCode) and
  1139. (((oppostfix in [PF_SB,PF_SH]) and (ref.offset<>0)) or
  1140. ((oppostfix=PF_None) and ((ref.offset<0) or ((ref.base<>NR_STACK_POINTER_REG) and (ref.offset>124)) or
  1141. ((ref.base=NR_STACK_POINTER_REG) and (ref.offset>1020)) or ((ref.offset mod 4)<>0))) or
  1142. ((oppostfix=PF_H) and ((ref.offset<0) or (ref.offset>62) or ((ref.offset mod 2)<>0) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0)))) or
  1143. ((oppostfix=PF_B) and ((ref.offset<0) or (ref.offset>31) or ((getsupreg(ref.base) in [RS_R8..RS_R15]) and (ref.offset<>0))))
  1144. )
  1145. ) then
  1146. begin
  1147. fixref(list,ref);
  1148. end;
  1149. if GenerateThumbCode then
  1150. begin
  1151. { certain thumb load require base and index }
  1152. if (oppostfix in [PF_SB,PF_SH]) and
  1153. (ref.base<>NR_NO) and (ref.index=NR_NO) then
  1154. begin
  1155. tmpreg1:=getintregister(list,OS_ADDR);
  1156. a_load_const_reg(list,OS_ADDR,0,tmpreg1);
  1157. ref.index:=tmpreg1;
  1158. end;
  1159. { "hi" registers cannot be used as base or index }
  1160. if (getsupreg(ref.base) in [RS_R8..RS_R12,RS_R14]) or
  1161. ((ref.base=NR_R13) and (ref.index<>NR_NO)) then
  1162. begin
  1163. tmpreg1:=getintregister(list,OS_ADDR);
  1164. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.base,tmpreg1);
  1165. ref.base:=tmpreg1;
  1166. end;
  1167. if getsupreg(ref.index) in [RS_R8..RS_R14] then
  1168. begin
  1169. tmpreg1:=getintregister(list,OS_ADDR);
  1170. a_load_reg_reg(list,OS_ADDR,OS_ADDR,ref.index,tmpreg1);
  1171. ref.index:=tmpreg1;
  1172. end;
  1173. end;
  1174. { fold if there is base, index and offset, however, don't fold
  1175. for vfp memory instructions because we later fold the index }
  1176. if not((op in [A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  1177. (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  1178. begin
  1179. if tmpreg1<>NR_NO then
  1180. begin
  1181. tmpreg2:=getintregister(list,OS_ADDR);
  1182. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg1,tmpreg2);
  1183. tmpreg1:=tmpreg2;
  1184. end
  1185. else
  1186. begin
  1187. tmpreg1:=getintregister(list,OS_ADDR);
  1188. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg1);
  1189. ref.base:=tmpreg1;
  1190. end;
  1191. ref.offset:=0;
  1192. end;
  1193. { floating point operations have only limited references
  1194. we expect here, that a base is already set }
  1195. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  1196. begin
  1197. if ref.shiftmode<>SM_none then
  1198. internalerror(200309121);
  1199. if tmpreg1<>NR_NO then
  1200. begin
  1201. if ref.base=tmpreg1 then
  1202. begin
  1203. if ref.signindex<0 then
  1204. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,tmpreg1,ref.index))
  1205. else
  1206. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,tmpreg1,ref.index));
  1207. ref.index:=NR_NO;
  1208. end
  1209. else
  1210. begin
  1211. if ref.index<>tmpreg1 then
  1212. internalerror(200403161);
  1213. if ref.signindex<0 then
  1214. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg1,ref.base,tmpreg1))
  1215. else
  1216. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,tmpreg1));
  1217. ref.base:=tmpreg1;
  1218. ref.index:=NR_NO;
  1219. end;
  1220. end
  1221. else
  1222. begin
  1223. tmpreg1:=getintregister(list,OS_ADDR);
  1224. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg1,ref.base,ref.index));
  1225. ref.base:=tmpreg1;
  1226. ref.index:=NR_NO;
  1227. end;
  1228. end;
  1229. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  1230. Result := ref;
  1231. end;
  1232. procedure tbasecgarm.a_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference);
  1233. var
  1234. oppostfix:toppostfix;
  1235. usedtmpref: treference;
  1236. tmpreg : tregister;
  1237. dir : integer;
  1238. begin
  1239. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  1240. FromSize := ToSize;
  1241. case ToSize of
  1242. { signed integer registers }
  1243. OS_8,
  1244. OS_S8:
  1245. oppostfix:=PF_B;
  1246. OS_16,
  1247. OS_S16:
  1248. oppostfix:=PF_H;
  1249. OS_32,
  1250. OS_S32,
  1251. { for vfp value stored in integer register }
  1252. OS_F32:
  1253. oppostfix:=PF_None;
  1254. else
  1255. InternalError(200308299);
  1256. end;
  1257. if ((ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[tosize])) or
  1258. ((not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) and
  1259. (oppostfix =PF_H)) then
  1260. begin
  1261. if target_info.endian=endian_big then
  1262. dir:=-1
  1263. else
  1264. dir:=1;
  1265. case FromSize of
  1266. OS_16,OS_S16:
  1267. begin
  1268. tmpreg:=getintregister(list,OS_INT);
  1269. usedtmpref:=ref;
  1270. if target_info.endian=endian_big then
  1271. inc(usedtmpref.offset,1);
  1272. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1273. inc(usedtmpref.offset,dir);
  1274. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1275. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1276. end;
  1277. OS_32,OS_S32:
  1278. begin
  1279. tmpreg:=getintregister(list,OS_INT);
  1280. usedtmpref:=ref;
  1281. if ref.alignment=2 then
  1282. begin
  1283. if target_info.endian=endian_big then
  1284. inc(usedtmpref.offset,2);
  1285. usedtmpref:=a_internal_load_reg_ref(list,OS_16,OS_16,reg,usedtmpref);
  1286. a_op_const_reg_reg(list,OP_SHR,OS_INT,16,reg,tmpreg);
  1287. inc(usedtmpref.offset,dir*2);
  1288. a_internal_load_reg_ref(list,OS_16,OS_16,tmpreg,usedtmpref);
  1289. end
  1290. else
  1291. begin
  1292. if target_info.endian=endian_big then
  1293. inc(usedtmpref.offset,3);
  1294. usedtmpref:=a_internal_load_reg_ref(list,OS_8,OS_8,reg,usedtmpref);
  1295. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1296. inc(usedtmpref.offset,dir);
  1297. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1298. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1299. inc(usedtmpref.offset,dir);
  1300. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1301. a_op_const_reg(list,OP_SHR,OS_INT,8,tmpreg);
  1302. inc(usedtmpref.offset,dir);
  1303. a_internal_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref);
  1304. end;
  1305. end
  1306. else
  1307. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1308. end;
  1309. end
  1310. else
  1311. handle_load_store(list,A_STR,oppostfix,reg,ref);
  1312. end;
  1313. function tbasecgarm.a_internal_load_reg_ref(list : TAsmList; fromsize, tosize: tcgsize; reg : tregister;const ref : treference):treference;
  1314. var
  1315. oppostfix:toppostfix;
  1316. href: treference;
  1317. tmpreg: TRegister;
  1318. begin
  1319. case ToSize of
  1320. { signed integer registers }
  1321. OS_8,
  1322. OS_S8:
  1323. oppostfix:=PF_B;
  1324. OS_16,
  1325. OS_S16:
  1326. oppostfix:=PF_H;
  1327. OS_32,
  1328. OS_S32:
  1329. oppostfix:=PF_None;
  1330. else
  1331. InternalError(2003082910);
  1332. end;
  1333. if (tosize in [OS_S16,OS_16]) and
  1334. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1335. begin
  1336. result:=handle_load_store(list,A_STR,PF_B,reg,ref);
  1337. tmpreg:=getintregister(list,OS_INT);
  1338. a_op_const_reg_reg(list,OP_SHR,OS_INT,8,reg,tmpreg);
  1339. href:=result;
  1340. inc(href.offset);
  1341. handle_load_store(list,A_STR,PF_B,tmpreg,href);
  1342. end
  1343. else
  1344. result:=handle_load_store(list,A_STR,oppostfix,reg,ref);
  1345. end;
  1346. function tbasecgarm.a_internal_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister):treference;
  1347. var
  1348. oppostfix:toppostfix;
  1349. so: tshifterop;
  1350. tmpreg: TRegister;
  1351. href: treference;
  1352. begin
  1353. case FromSize of
  1354. { signed integer registers }
  1355. OS_8:
  1356. oppostfix:=PF_B;
  1357. OS_S8:
  1358. oppostfix:=PF_SB;
  1359. OS_16:
  1360. oppostfix:=PF_H;
  1361. OS_S16:
  1362. oppostfix:=PF_SH;
  1363. OS_32,
  1364. OS_S32:
  1365. oppostfix:=PF_None;
  1366. else
  1367. InternalError(200308291);
  1368. end;
  1369. if (tosize=OS_S8) and
  1370. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1371. begin
  1372. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1373. a_load_reg_reg(list,OS_S8,OS_32,reg,reg);
  1374. end
  1375. else if (tosize in [OS_S16,OS_16]) and
  1376. (not (CPUARM_HAS_ALL_MEM in cpu_capabilities[current_settings.cputype])) then
  1377. begin
  1378. result:=handle_load_store(list,A_LDR,PF_B,reg,ref);
  1379. tmpreg:=getintregister(list,OS_INT);
  1380. href:=result;
  1381. inc(href.offset);
  1382. handle_load_store(list,A_LDR,PF_B,tmpreg,href);
  1383. shifterop_reset(so);
  1384. so.shiftmode:=SM_LSL;
  1385. so.shiftimm:=8;
  1386. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  1387. end
  1388. else
  1389. result:=handle_load_store(list,A_LDR,oppostfix,reg,ref);
  1390. end;
  1391. procedure tbasecgarm.a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);
  1392. var
  1393. so : tshifterop;
  1394. procedure do_shift(shiftmode : tshiftmode; shiftimm : byte; reg : tregister);
  1395. begin
  1396. if GenerateThumbCode then
  1397. begin
  1398. case shiftmode of
  1399. SM_ASR:
  1400. a_op_const_reg_reg(list,OP_SAR,OS_32,shiftimm,reg,reg2);
  1401. SM_LSR:
  1402. a_op_const_reg_reg(list,OP_SHR,OS_32,shiftimm,reg,reg2);
  1403. SM_LSL:
  1404. a_op_const_reg_reg(list,OP_SHL,OS_32,shiftimm,reg,reg2);
  1405. else
  1406. internalerror(2013090301);
  1407. end;
  1408. end
  1409. else
  1410. begin
  1411. so.shiftmode:=shiftmode;
  1412. so.shiftimm:=shiftimm;
  1413. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,reg2,reg,so));
  1414. end;
  1415. end;
  1416. var
  1417. instr: taicpu;
  1418. conv_done: boolean;
  1419. begin
  1420. if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then
  1421. internalerror(2002090901);
  1422. conv_done:=false;
  1423. if tosize<>fromsize then
  1424. begin
  1425. shifterop_reset(so);
  1426. conv_done:=true;
  1427. if tcgsize2size[tosize]<=tcgsize2size[fromsize] then
  1428. fromsize:=tosize;
  1429. if current_settings.cputype<cpu_armv6 then
  1430. case fromsize of
  1431. OS_8:
  1432. if GenerateThumbCode then
  1433. a_op_const_reg_reg(list,OP_AND,OS_32,$ff,reg1,reg2)
  1434. else
  1435. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1436. OS_S8:
  1437. begin
  1438. do_shift(SM_LSL,24,reg1);
  1439. if tosize=OS_16 then
  1440. begin
  1441. do_shift(SM_ASR,8,reg2);
  1442. do_shift(SM_LSR,16,reg2);
  1443. end
  1444. else
  1445. do_shift(SM_ASR,24,reg2);
  1446. end;
  1447. OS_16:
  1448. begin
  1449. do_shift(SM_LSL,16,reg1);
  1450. do_shift(SM_LSR,16,reg2);
  1451. end;
  1452. OS_S16:
  1453. begin
  1454. do_shift(SM_LSL,16,reg1);
  1455. do_shift(SM_ASR,16,reg2)
  1456. end;
  1457. else
  1458. conv_done:=false;
  1459. end
  1460. else
  1461. case fromsize of
  1462. OS_8:
  1463. if GenerateThumbCode then
  1464. list.concat(taicpu.op_reg_reg(A_UXTB,reg2,reg1))
  1465. else
  1466. list.concat(taicpu.op_reg_reg_const(A_AND,reg2,reg1,$ff));
  1467. OS_S8:
  1468. begin
  1469. if tosize=OS_16 then
  1470. begin
  1471. so.shiftmode:=SM_ROR;
  1472. so.shiftimm:=16;
  1473. list.concat(taicpu.op_reg_reg_shifterop(A_SXTB16,reg2,reg1,so));
  1474. do_shift(SM_LSR,16,reg2);
  1475. end
  1476. else
  1477. list.concat(taicpu.op_reg_reg(A_SXTB,reg2,reg1));
  1478. end;
  1479. OS_16:
  1480. list.concat(taicpu.op_reg_reg(A_UXTH,reg2,reg1));
  1481. OS_S16:
  1482. list.concat(taicpu.op_reg_reg(A_SXTH,reg2,reg1));
  1483. else
  1484. conv_done:=false;
  1485. end
  1486. end;
  1487. if not conv_done and (reg1<>reg2) then
  1488. begin
  1489. { same size, only a register mov required }
  1490. instr:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
  1491. list.Concat(instr);
  1492. { Notify the register allocator that we have written a move instruction so
  1493. it can try to eliminate it. }
  1494. add_move_instruction(instr);
  1495. end;
  1496. end;
  1497. procedure tbasecgarm.a_loadfpu_ref_cgpara(list : TAsmList;size : tcgsize;const ref : treference;const paraloc : TCGPara);
  1498. var
  1499. href,href2 : treference;
  1500. hloc : pcgparalocation;
  1501. begin
  1502. href:=ref;
  1503. hloc:=paraloc.location;
  1504. while assigned(hloc) do
  1505. begin
  1506. case hloc^.loc of
  1507. LOC_FPUREGISTER,LOC_CFPUREGISTER:
  1508. begin
  1509. paramanager.allocparaloc(list,paraloc.location);
  1510. a_loadfpu_ref_reg(list,size,size,ref,hloc^.register);
  1511. end;
  1512. LOC_REGISTER :
  1513. case hloc^.size of
  1514. OS_32,
  1515. OS_F32:
  1516. begin
  1517. paramanager.allocparaloc(list,paraloc.location);
  1518. a_load_ref_reg(list,OS_32,OS_32,href,hloc^.register);
  1519. end;
  1520. OS_64,
  1521. OS_F64:
  1522. cg64.a_load64_ref_cgpara(list,href,paraloc);
  1523. else
  1524. a_load_ref_reg(list,hloc^.size,hloc^.size,href,hloc^.register);
  1525. end;
  1526. LOC_REFERENCE :
  1527. begin
  1528. reference_reset_base(href2,hloc^.reference.index,hloc^.reference.offset,paraloc.alignment);
  1529. { concatcopy should choose the best way to copy the data }
  1530. g_concatcopy(list,href,href2,tcgsize2size[hloc^.size]);
  1531. end;
  1532. else
  1533. internalerror(200408241);
  1534. end;
  1535. inc(href.offset,tcgsize2size[hloc^.size]);
  1536. hloc:=hloc^.next;
  1537. end;
  1538. end;
  1539. procedure tbasecgarm.a_loadfpu_reg_reg(list: TAsmList; fromsize,tosize: tcgsize; reg1, reg2: tregister);
  1540. begin
  1541. list.concat(setoppostfix(taicpu.op_reg_reg(A_MVF,reg2,reg1),cgsize2fpuoppostfix[tosize]));
  1542. end;
  1543. procedure tbasecgarm.a_loadfpu_ref_reg(list: TAsmList; fromsize,tosize: tcgsize; const ref: treference; reg: tregister);
  1544. var
  1545. oppostfix:toppostfix;
  1546. begin
  1547. case fromsize of
  1548. OS_32,
  1549. OS_F32:
  1550. oppostfix:=PF_S;
  1551. OS_64,
  1552. OS_F64:
  1553. oppostfix:=PF_D;
  1554. OS_F80:
  1555. oppostfix:=PF_E;
  1556. else
  1557. InternalError(200309021);
  1558. end;
  1559. handle_load_store(list,A_LDF,oppostfix,reg,ref);
  1560. if fromsize<>tosize then
  1561. a_loadfpu_reg_reg(list,fromsize,tosize,reg,reg);
  1562. end;
  1563. procedure tbasecgarm.a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);
  1564. var
  1565. oppostfix:toppostfix;
  1566. begin
  1567. case tosize of
  1568. OS_F32:
  1569. oppostfix:=PF_S;
  1570. OS_F64:
  1571. oppostfix:=PF_D;
  1572. OS_F80:
  1573. oppostfix:=PF_E;
  1574. else
  1575. InternalError(200309022);
  1576. end;
  1577. handle_load_store(list,A_STF,oppostfix,reg,ref);
  1578. end;
  1579. { comparison operations }
  1580. procedure tbasecgarm.a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;
  1581. l : tasmlabel);
  1582. var
  1583. tmpreg : tregister;
  1584. b : byte;
  1585. begin
  1586. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1587. if (not(GenerateThumbCode) and is_shifter_const(a,b)) or
  1588. ((GenerateThumbCode) and is_thumb_imm(a)) then
  1589. list.concat(taicpu.op_reg_const(A_CMP,reg,a))
  1590. { CMN reg,0 and CMN reg,$80000000 are different from CMP reg,$ffffffff
  1591. and CMP reg,$7fffffff regarding the flags according to the ARM manual }
  1592. else if (a<>$7fffffff) and (a<>-1) and not(GenerateThumbCode) and is_shifter_const(-a,b) then
  1593. list.concat(taicpu.op_reg_const(A_CMN,reg,-a))
  1594. else
  1595. begin
  1596. tmpreg:=getintregister(list,size);
  1597. a_load_const_reg(list,size,a,tmpreg);
  1598. list.concat(taicpu.op_reg_reg(A_CMP,reg,tmpreg));
  1599. end;
  1600. a_jmp_cond(list,cmp_op,l);
  1601. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1602. end;
  1603. procedure tbasecgarm.a_bit_scan_reg_reg(list: TAsmList; reverse: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister);
  1604. begin
  1605. if reverse then
  1606. begin
  1607. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,src));
  1608. list.Concat(taicpu.op_reg_reg_const(A_RSB,dst,dst,31));
  1609. list.Concat(taicpu.op_reg_reg_const(A_AND,dst,dst,255));
  1610. end
  1611. { it is decided during the compilation of the system unit if this code is used or not
  1612. so no additional check for rbit is needed }
  1613. else
  1614. begin
  1615. list.Concat(taicpu.op_reg_reg(A_RBIT,dst,src));
  1616. list.Concat(taicpu.op_reg_reg(A_CLZ,dst,dst));
  1617. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1618. list.Concat(taicpu.op_reg_const(A_CMP,dst,32));
  1619. if GenerateThumb2Code then
  1620. list.Concat(taicpu.op_cond(A_IT, C_EQ));
  1621. list.Concat(setcondition(taicpu.op_reg_const(A_MOV,dst,$ff),C_EQ));
  1622. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1623. end;
  1624. end;
  1625. procedure tbasecgarm.a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel);
  1626. begin
  1627. a_reg_alloc(list,NR_DEFAULTFLAGS);
  1628. list.concat(taicpu.op_reg_reg(A_CMP,reg2,reg1));
  1629. a_jmp_cond(list,cmp_op,l);
  1630. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  1631. end;
  1632. procedure tbasecgarm.a_jmp_name(list : TAsmList;const s : string);
  1633. var
  1634. ai : taicpu;
  1635. begin
  1636. { generate far jump, leave it to the optimizer to get rid of it }
  1637. if GenerateThumbCode then
  1638. ai:=taicpu.op_sym(A_BL,current_asmdata.RefAsmSymbol(s))
  1639. else
  1640. ai:=taicpu.op_sym(A_B,current_asmdata.RefAsmSymbol(s));
  1641. ai.is_jmp:=true;
  1642. list.concat(ai);
  1643. end;
  1644. procedure tbasecgarm.a_jmp_always(list : TAsmList;l: tasmlabel);
  1645. var
  1646. ai : taicpu;
  1647. begin
  1648. { generate far jump, leave it to the optimizer to get rid of it }
  1649. if GenerateThumbCode then
  1650. ai:=taicpu.op_sym(A_BL,l)
  1651. else
  1652. ai:=taicpu.op_sym(A_B,l);
  1653. ai.is_jmp:=true;
  1654. list.concat(ai);
  1655. end;
  1656. procedure tbasecgarm.a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel);
  1657. var
  1658. ai : taicpu;
  1659. inv_flags : TResFlags;
  1660. hlabel : TAsmLabel;
  1661. begin
  1662. if GenerateThumbCode then
  1663. begin
  1664. inv_flags:=f;
  1665. inverse_flags(inv_flags);
  1666. { the optimizer has to fix this if jump range is sufficient short }
  1667. current_asmdata.getjumplabel(hlabel);
  1668. ai:=setcondition(taicpu.op_sym(A_B,hlabel),flags_to_cond(inv_flags));
  1669. ai.is_jmp:=true;
  1670. list.concat(ai);
  1671. a_jmp_always(list,l);
  1672. a_label(list,hlabel);
  1673. end
  1674. else
  1675. begin
  1676. ai:=setcondition(taicpu.op_sym(A_B,l),flags_to_cond(f));
  1677. ai.is_jmp:=true;
  1678. list.concat(ai);
  1679. end;
  1680. end;
  1681. procedure tbasecgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  1682. begin
  1683. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  1684. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  1685. end;
  1686. procedure tbasecgarm.g_profilecode(list : TAsmList);
  1687. begin
  1688. if target_info.system = system_arm_linux then
  1689. begin
  1690. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R14]));
  1691. a_call_name(list,'__gnu_mcount_nc',false);
  1692. end
  1693. else
  1694. internalerror(2014091201);
  1695. end;
  1696. procedure tbasecgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  1697. var
  1698. ref : treference;
  1699. shift : byte;
  1700. firstfloatreg,lastfloatreg,
  1701. r : byte;
  1702. mmregs,
  1703. regs, saveregs : tcpuregisterset;
  1704. registerarea,
  1705. r7offset,
  1706. stackmisalignment : pint;
  1707. postfix: toppostfix;
  1708. imm1, imm2: DWord;
  1709. stack_parameters : Boolean;
  1710. begin
  1711. LocalSize:=align(LocalSize,4);
  1712. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  1713. { call instruction does not put anything on the stack }
  1714. registerarea:=0;
  1715. tarmprocinfo(current_procinfo).stackpaddingreg:=High(TSuperRegister);
  1716. lastfloatreg:=RS_NO;
  1717. if not(nostackframe) then
  1718. begin
  1719. firstfloatreg:=RS_NO;
  1720. mmregs:=[];
  1721. case current_settings.fputype of
  1722. fpu_fpa,
  1723. fpu_fpa10,
  1724. fpu_fpa11:
  1725. begin
  1726. { save floating point registers? }
  1727. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1728. for r:=RS_F0 to RS_F7 do
  1729. if r in regs then
  1730. begin
  1731. if firstfloatreg=RS_NO then
  1732. firstfloatreg:=r;
  1733. lastfloatreg:=r;
  1734. inc(registerarea,12);
  1735. end;
  1736. end;
  1737. fpu_vfpv2,
  1738. fpu_vfpv3,
  1739. fpu_vfpv3_d16:
  1740. begin;
  1741. mmregs:=rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall);
  1742. end;
  1743. end;
  1744. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1745. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1746. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  1747. { save int registers }
  1748. reference_reset(ref,4);
  1749. ref.index:=NR_STACK_POINTER_REG;
  1750. ref.addressmode:=AM_PREINDEXED;
  1751. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  1752. if not(target_info.system in systems_darwin) then
  1753. begin
  1754. a_reg_alloc(list,NR_STACK_POINTER_REG);
  1755. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1756. begin
  1757. a_reg_alloc(list,NR_R12);
  1758. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  1759. end;
  1760. { the (old) ARM APCS requires saving both the stack pointer (to
  1761. crawl the stack) and the PC (to identify the function this
  1762. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  1763. and R15 -- still needs updating for EABI and Darwin, they don't
  1764. need that }
  1765. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1766. regs:=regs+[RS_FRAME_POINTER_REG,RS_R12,RS_R14,RS_R15]
  1767. else
  1768. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1769. include(regs,RS_R14);
  1770. if regs<>[] then
  1771. begin
  1772. for r:=RS_R0 to RS_R15 do
  1773. if r in regs then
  1774. inc(registerarea,4);
  1775. { if the stack is not 8 byte aligned, try to add an extra register,
  1776. so we can avoid the extra sub/add ...,#4 later (KB) }
  1777. if ((registerarea mod current_settings.alignment.localalignmax) <> 0) then
  1778. for r:=RS_R3 downto RS_R0 do
  1779. if not(r in regs) then
  1780. begin
  1781. regs:=regs+[r];
  1782. inc(registerarea,4);
  1783. tarmprocinfo(current_procinfo).stackpaddingreg:=r;
  1784. break;
  1785. end;
  1786. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  1787. end;
  1788. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  1789. begin
  1790. { the framepointer now points to the saved R15, so the saved
  1791. framepointer is at R11-12 (for get_caller_frame) }
  1792. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  1793. a_reg_dealloc(list,NR_R12);
  1794. end;
  1795. end
  1796. else
  1797. begin
  1798. { always save r14 if we use r7 as the framepointer, because
  1799. the parameter offsets are hardcoded in advance and always
  1800. assume that r14 sits on the stack right behind the saved r7
  1801. }
  1802. if current_procinfo.framepointer=NR_FRAME_POINTER_REG then
  1803. include(regs,RS_FRAME_POINTER_REG);
  1804. if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  1805. include(regs,RS_R14);
  1806. if regs<>[] then
  1807. begin
  1808. { on Darwin, you first have to save [r4-r7,lr], and then
  1809. [r8,r10,r11] and make r7 point to the previously saved
  1810. r7 so that you can perform a stack crawl based on it
  1811. ([r7] is previous stack frame, [r7+4] is return address
  1812. }
  1813. include(regs,RS_FRAME_POINTER_REG);
  1814. saveregs:=regs-[RS_R8,RS_R10,RS_R11];
  1815. r7offset:=0;
  1816. for r:=RS_R0 to RS_R15 do
  1817. if r in saveregs then
  1818. begin
  1819. inc(registerarea,4);
  1820. if r<RS_FRAME_POINTER_REG then
  1821. inc(r7offset,4);
  1822. end;
  1823. { save the registers }
  1824. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1825. { make r7 point to the saved r7 (regardless of whether this
  1826. frame uses the framepointer, for backtrace purposes) }
  1827. if r7offset<>0 then
  1828. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_FRAME_POINTER_REG,NR_R13,r7offset))
  1829. else
  1830. list.concat(taicpu.op_reg_reg(A_MOV,NR_R7,NR_R13));
  1831. { now save the rest (if any) }
  1832. saveregs:=regs-saveregs;
  1833. if saveregs<>[] then
  1834. begin
  1835. for r:=RS_R8 to RS_R11 do
  1836. if r in saveregs then
  1837. inc(registerarea,4);
  1838. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  1839. end;
  1840. end;
  1841. end;
  1842. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  1843. if (LocalSize<>0) or
  1844. ((stackmisalignment<>0) and
  1845. ((pi_do_call in current_procinfo.flags) or
  1846. (po_assembler in current_procinfo.procdef.procoptions))) then
  1847. begin
  1848. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  1849. if stack_parameters and (pi_estimatestacksize in current_procinfo.flags) then
  1850. begin
  1851. if localsize>tarmprocinfo(current_procinfo).stackframesize then
  1852. internalerror(2014030901)
  1853. else
  1854. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea;
  1855. end;
  1856. if is_shifter_const(localsize,shift) then
  1857. begin
  1858. a_reg_dealloc(list,NR_R12);
  1859. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  1860. end
  1861. else if split_into_shifter_const(localsize, imm1, imm2) then
  1862. begin
  1863. a_reg_dealloc(list,NR_R12);
  1864. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  1865. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  1866. end
  1867. else
  1868. begin
  1869. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  1870. a_reg_alloc(list,NR_R12);
  1871. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  1872. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  1873. a_reg_dealloc(list,NR_R12);
  1874. end;
  1875. end;
  1876. if (mmregs<>[]) or
  1877. (firstfloatreg<>RS_NO) then
  1878. begin
  1879. reference_reset(ref,4);
  1880. if (tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023) or
  1881. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv3_d16]) then
  1882. begin
  1883. if not is_shifter_const(tarmprocinfo(current_procinfo).floatregstart,shift) then
  1884. begin
  1885. a_reg_alloc(list,NR_R12);
  1886. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  1887. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1888. a_reg_dealloc(list,NR_R12);
  1889. end
  1890. else
  1891. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tarmprocinfo(current_procinfo).floatregstart));
  1892. ref.base:=NR_R12;
  1893. end
  1894. else
  1895. begin
  1896. ref.base:=current_procinfo.framepointer;
  1897. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  1898. end;
  1899. case current_settings.fputype of
  1900. fpu_fpa,
  1901. fpu_fpa10,
  1902. fpu_fpa11:
  1903. begin
  1904. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  1905. lastfloatreg-firstfloatreg+1,ref));
  1906. end;
  1907. fpu_vfpv2,
  1908. fpu_vfpv3,
  1909. fpu_vfpv3_d16:
  1910. begin
  1911. ref.index:=ref.base;
  1912. ref.base:=NR_NO;
  1913. { FSTMX is deprecated on ARMv6 and later }
  1914. {if (current_settings.cputype<cpu_armv6) then
  1915. postfix:=PF_IAX
  1916. else
  1917. postfix:=PF_IAD;}
  1918. list.concat(taicpu.op_ref_regset(A_VSTM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  1919. end;
  1920. end;
  1921. end;
  1922. end;
  1923. end;
  1924. procedure tbasecgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  1925. var
  1926. ref : treference;
  1927. LocalSize : longint;
  1928. firstfloatreg,lastfloatreg,
  1929. r,
  1930. shift : byte;
  1931. mmregs,
  1932. saveregs,
  1933. regs : tcpuregisterset;
  1934. registerarea,
  1935. stackmisalignment: pint;
  1936. paddingreg: TSuperRegister;
  1937. mmpostfix: toppostfix;
  1938. imm1, imm2: DWord;
  1939. begin
  1940. { Release PIC register }
  1941. if (cs_create_pic in current_settings.moduleswitches) and
  1942. (tf_pic_uses_got in target_info.flags) and
  1943. (pi_needs_got in current_procinfo.flags)
  1944. then
  1945. list.concat(tai_regalloc.dealloc(current_procinfo.got,nil));
  1946. if not(nostackframe) then
  1947. begin
  1948. registerarea:=0;
  1949. firstfloatreg:=RS_NO;
  1950. lastfloatreg:=RS_NO;
  1951. mmregs:=[];
  1952. saveregs:=[];
  1953. case current_settings.fputype of
  1954. fpu_fpa,
  1955. fpu_fpa10,
  1956. fpu_fpa11:
  1957. begin
  1958. { restore floating point registers? }
  1959. regs:=rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);
  1960. for r:=RS_F0 to RS_F7 do
  1961. if r in regs then
  1962. begin
  1963. if firstfloatreg=RS_NO then
  1964. firstfloatreg:=r;
  1965. lastfloatreg:=r;
  1966. { floating point register space is already included in
  1967. localsize below by calc_stackframe_size
  1968. inc(registerarea,12);
  1969. }
  1970. end;
  1971. end;
  1972. fpu_vfpv2,
  1973. fpu_vfpv3,
  1974. fpu_vfpv3_d16:
  1975. begin;
  1976. { restore vfp registers? }
  1977. mmregs:=rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall);
  1978. end;
  1979. end;
  1980. if (firstfloatreg<>RS_NO) or
  1981. (mmregs<>[]) then
  1982. begin
  1983. reference_reset(ref,4);
  1984. if (tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023) or
  1985. (current_settings.fputype in [fpu_vfpv2,fpu_vfpv3,fpu_vfpv3_d16]) then
  1986. begin
  1987. if not is_shifter_const(tarmprocinfo(current_procinfo).floatregstart,shift) then
  1988. begin
  1989. a_reg_alloc(list,NR_R12);
  1990. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  1991. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  1992. a_reg_dealloc(list,NR_R12);
  1993. end
  1994. else
  1995. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_R12,current_procinfo.framepointer,-tarmprocinfo(current_procinfo).floatregstart));
  1996. ref.base:=NR_R12;
  1997. end
  1998. else
  1999. begin
  2000. ref.base:=current_procinfo.framepointer;
  2001. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  2002. end;
  2003. case current_settings.fputype of
  2004. fpu_fpa,
  2005. fpu_fpa10,
  2006. fpu_fpa11:
  2007. begin
  2008. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  2009. lastfloatreg-firstfloatreg+1,ref));
  2010. end;
  2011. fpu_vfpv2,
  2012. fpu_vfpv3,
  2013. fpu_vfpv3_d16:
  2014. begin
  2015. ref.index:=ref.base;
  2016. ref.base:=NR_NO;
  2017. { FLDMX is deprecated on ARMv6 and later }
  2018. {if (current_settings.cputype<cpu_armv6) then
  2019. mmpostfix:=PF_IAX
  2020. else
  2021. mmpostfix:=PF_IAD;}
  2022. list.concat(taicpu.op_ref_regset(A_VLDM,ref,R_MMREGISTER,R_SUBFD,mmregs));
  2023. end;
  2024. end;
  2025. end;
  2026. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  2027. if (pi_do_call in current_procinfo.flags) or
  2028. (regs<>[]) or
  2029. ((target_info.system in systems_darwin) and
  2030. (current_procinfo.framepointer<>NR_STACK_POINTER_REG)) then
  2031. begin
  2032. exclude(regs,RS_R14);
  2033. include(regs,RS_R15);
  2034. if (target_info.system in systems_darwin) then
  2035. include(regs,RS_FRAME_POINTER_REG);
  2036. end;
  2037. if not(target_info.system in systems_darwin) then
  2038. begin
  2039. { restore saved stack pointer to SP (R13) and saved lr to PC (R15).
  2040. The saved PC came after that but is discarded, since we restore
  2041. the stack pointer }
  2042. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  2043. regs:=regs+[RS_FRAME_POINTER_REG,RS_R13,RS_R15];
  2044. end
  2045. else
  2046. begin
  2047. { restore R8-R11 already if necessary (they've been stored
  2048. before the others) }
  2049. saveregs:=regs*[RS_R8,RS_R10,RS_R11];
  2050. if saveregs<>[] then
  2051. begin
  2052. reference_reset(ref,4);
  2053. ref.index:=NR_STACK_POINTER_REG;
  2054. ref.addressmode:=AM_PREINDEXED;
  2055. for r:=RS_R8 to RS_R11 do
  2056. if r in saveregs then
  2057. inc(registerarea,4);
  2058. regs:=regs-saveregs;
  2059. end;
  2060. end;
  2061. for r:=RS_R0 to RS_R15 do
  2062. if r in regs then
  2063. inc(registerarea,4);
  2064. { reapply the stack padding reg, in case there was one, see the complimentary
  2065. comment in g_proc_entry() (KB) }
  2066. paddingreg:=tarmprocinfo(current_procinfo).stackpaddingreg;
  2067. if paddingreg < RS_R4 then
  2068. if paddingreg in regs then
  2069. internalerror(201306190)
  2070. else
  2071. begin
  2072. regs:=regs+[paddingreg];
  2073. inc(registerarea,4);
  2074. end;
  2075. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  2076. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  2077. (target_info.system in systems_darwin) then
  2078. begin
  2079. LocalSize:=current_procinfo.calc_stackframe_size;
  2080. if (LocalSize<>0) or
  2081. ((stackmisalignment<>0) and
  2082. ((pi_do_call in current_procinfo.flags) or
  2083. (po_assembler in current_procinfo.procdef.procoptions))) then
  2084. begin
  2085. if pi_estimatestacksize in current_procinfo.flags then
  2086. LocalSize:=tarmprocinfo(current_procinfo).stackframesize-registerarea
  2087. else
  2088. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  2089. if is_shifter_const(LocalSize,shift) then
  2090. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  2091. else if split_into_shifter_const(localsize, imm1, imm2) then
  2092. begin
  2093. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm1));
  2094. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,imm2));
  2095. end
  2096. else
  2097. begin
  2098. a_reg_alloc(list,NR_R12);
  2099. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  2100. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  2101. a_reg_dealloc(list,NR_R12);
  2102. end;
  2103. end;
  2104. if (target_info.system in systems_darwin) and
  2105. (saveregs<>[]) then
  2106. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,saveregs),PF_FD));
  2107. if regs=[] then
  2108. begin
  2109. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2110. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2111. else
  2112. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2113. end
  2114. else
  2115. begin
  2116. reference_reset(ref,4);
  2117. ref.index:=NR_STACK_POINTER_REG;
  2118. ref.addressmode:=AM_PREINDEXED;
  2119. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  2120. end;
  2121. end
  2122. else
  2123. begin
  2124. { restore int registers and return }
  2125. reference_reset(ref,4);
  2126. ref.index:=NR_FRAME_POINTER_REG;
  2127. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_EA));
  2128. end;
  2129. end
  2130. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  2131. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  2132. else
  2133. list.concat(taicpu.op_reg(A_BX,NR_R14))
  2134. end;
  2135. procedure tbasecgarm.g_maybe_got_init(list : TAsmList);
  2136. var
  2137. ref : treference;
  2138. l : TAsmLabel;
  2139. begin
  2140. if (cs_create_pic in current_settings.moduleswitches) and
  2141. (pi_needs_got in current_procinfo.flags) and
  2142. (tf_pic_uses_got in target_info.flags) then
  2143. begin
  2144. reference_reset(ref,4);
  2145. current_asmdata.getglobaldatalabel(l);
  2146. cg.a_label(current_procinfo.aktlocaldata,l);
  2147. ref.symbol:=l;
  2148. ref.base:=NR_PC;
  2149. ref.symboldata:=current_procinfo.aktlocaldata.last;
  2150. a_reg_alloc(list,NR_R12);
  2151. list.concat(Taicpu.op_reg_ref(A_LDR,NR_R12,ref));
  2152. current_asmdata.getaddrlabel(l);
  2153. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_32bit,l,current_asmdata.RefAsmSymbol('_GLOBAL_OFFSET_TABLE_'),-8));
  2154. cg.a_label(list,l);
  2155. {
  2156. It is needed to perform GOT calculations using the scratch register R12
  2157. and then MOV the result to the GOT register. Otherwise the register allocator will use
  2158. register R0 as temp to perform calculations in case if a procedure uses all available registers.
  2159. It leads to corruption of R0 which is normally holds a value of the first procedure parameter.
  2160. }
  2161. list.concat(Taicpu.op_reg_reg_reg(A_ADD,NR_R12,NR_PC,NR_R12));
  2162. list.concat(Taicpu.op_reg_reg(A_MOV,current_procinfo.got,NR_R12));
  2163. a_reg_dealloc(list,NR_R12);
  2164. end;
  2165. end;
  2166. procedure tbasecgarm.a_loadaddr_ref_reg(list : TAsmList;const ref : treference;r : tregister);
  2167. var
  2168. b : byte;
  2169. tmpref : treference;
  2170. instr : taicpu;
  2171. begin
  2172. if ref.addressmode<>AM_OFFSET then
  2173. internalerror(200309071);
  2174. tmpref:=ref;
  2175. { Be sure to have a base register }
  2176. if (tmpref.base=NR_NO) then
  2177. begin
  2178. if tmpref.shiftmode<>SM_None then
  2179. internalerror(2014020702);
  2180. if tmpref.signindex<0 then
  2181. internalerror(200312023);
  2182. tmpref.base:=tmpref.index;
  2183. tmpref.index:=NR_NO;
  2184. end;
  2185. if assigned(tmpref.symbol) or
  2186. not((is_shifter_const(tmpref.offset,b)) or
  2187. (is_shifter_const(-tmpref.offset,b))
  2188. ) then
  2189. fixref(list,tmpref);
  2190. { expect a base here if there is an index }
  2191. if (tmpref.base=NR_NO) and (tmpref.index<>NR_NO) then
  2192. internalerror(200312022);
  2193. if tmpref.index<>NR_NO then
  2194. begin
  2195. if tmpref.shiftmode<>SM_None then
  2196. internalerror(200312021);
  2197. if tmpref.signindex<0 then
  2198. a_op_reg_reg_reg(list,OP_SUB,OS_ADDR,tmpref.base,tmpref.index,r)
  2199. else
  2200. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpref.base,tmpref.index,r);
  2201. if tmpref.offset<>0 then
  2202. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,r,r);
  2203. end
  2204. else
  2205. begin
  2206. if tmpref.base=NR_NO then
  2207. a_load_const_reg(list,OS_ADDR,tmpref.offset,r)
  2208. else
  2209. if tmpref.offset<>0 then
  2210. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,tmpref.base,r)
  2211. else
  2212. begin
  2213. instr:=taicpu.op_reg_reg(A_MOV,r,tmpref.base);
  2214. list.concat(instr);
  2215. add_move_instruction(instr);
  2216. end;
  2217. end;
  2218. end;
  2219. procedure tbasecgarm.fixref(list : TAsmList;var ref : treference);
  2220. var
  2221. tmpreg, tmpreg2 : tregister;
  2222. tmpref : treference;
  2223. l, piclabel : tasmlabel;
  2224. indirection_done : boolean;
  2225. begin
  2226. { absolute symbols can't be handled directly, we've to store the symbol reference
  2227. in the text segment and access it pc relative
  2228. For now, we assume that references where base or index equals to PC are already
  2229. relative, all other references are assumed to be absolute and thus they need
  2230. to be handled extra.
  2231. A proper solution would be to change refoptions to a set and store the information
  2232. if the symbol is absolute or relative there.
  2233. }
  2234. { create consts entry }
  2235. reference_reset(tmpref,4);
  2236. current_asmdata.getjumplabel(l);
  2237. cg.a_label(current_procinfo.aktlocaldata,l);
  2238. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  2239. piclabel:=nil;
  2240. tmpreg:=NR_NO;
  2241. indirection_done:=false;
  2242. if assigned(ref.symbol) then
  2243. begin
  2244. if (target_info.system=system_arm_darwin) and
  2245. (ref.symbol.bind in [AB_EXTERNAL,AB_WEAK_EXTERNAL,AB_PRIVATE_EXTERN,AB_COMMON]) then
  2246. begin
  2247. tmpreg:=g_indirect_sym_load(list,ref.symbol.name,asmsym2indsymflags(ref.symbol));
  2248. if ref.offset<>0 then
  2249. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2250. indirection_done:=true;
  2251. end
  2252. else if (cs_create_pic in current_settings.moduleswitches) then
  2253. if (tf_pic_uses_got in target_info.flags) then
  2254. current_procinfo.aktlocaldata.concat(tai_const.Create_type_sym(aitconst_got,ref.symbol))
  2255. else
  2256. begin
  2257. { ideally, we would want to generate
  2258. ldr r1, LPICConstPool
  2259. LPICLocal:
  2260. ldr/str r2,[pc,r1]
  2261. ...
  2262. LPICConstPool:
  2263. .long _globsym-(LPICLocal+8)
  2264. However, we cannot be sure that the ldr/str will follow
  2265. right after the call to fixref, so we have to load the
  2266. complete address already in a register.
  2267. }
  2268. current_asmdata.getaddrlabel(piclabel);
  2269. current_procinfo.aktlocaldata.concat(tai_const.Create_rel_sym_offset(aitconst_ptr,piclabel,ref.symbol,ref.offset-8));
  2270. end
  2271. else
  2272. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset))
  2273. end
  2274. else
  2275. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ref.offset));
  2276. { load consts entry }
  2277. if not indirection_done then
  2278. begin
  2279. tmpreg:=getintregister(list,OS_INT);
  2280. tmpref.symbol:=l;
  2281. tmpref.base:=NR_PC;
  2282. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2283. if (cs_create_pic in current_settings.moduleswitches) and
  2284. (tf_pic_uses_got in target_info.flags) and
  2285. assigned(ref.symbol) then
  2286. begin
  2287. reference_reset(tmpref,4);
  2288. tmpref.base:=current_procinfo.got;
  2289. tmpref.index:=tmpreg;
  2290. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  2291. if ref.offset<>0 then
  2292. a_op_const_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg);
  2293. end;
  2294. end;
  2295. if assigned(piclabel) then
  2296. begin
  2297. cg.a_label(list,piclabel);
  2298. tmpreg2:=getaddressregister(list);
  2299. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpreg,NR_PC,tmpreg2);
  2300. tmpreg:=tmpreg2
  2301. end;
  2302. { This routine can be called with PC as base/index in case the offset
  2303. was too large to encode in a load/store. In that case, the entire
  2304. absolute expression has been re-encoded in a new constpool entry, and
  2305. we have to remove the use of PC from the original reference (the code
  2306. above made everything relative to the value loaded from the new
  2307. constpool entry) }
  2308. if is_pc(ref.base) then
  2309. ref.base:=NR_NO;
  2310. if is_pc(ref.index) then
  2311. ref.index:=NR_NO;
  2312. if (ref.base<>NR_NO) then
  2313. begin
  2314. if ref.index<>NR_NO then
  2315. begin
  2316. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  2317. ref.base:=tmpreg;
  2318. end
  2319. else
  2320. if ref.base<>NR_PC then
  2321. begin
  2322. ref.index:=tmpreg;
  2323. ref.shiftimm:=0;
  2324. ref.signindex:=1;
  2325. ref.shiftmode:=SM_None;
  2326. end
  2327. else
  2328. ref.base:=tmpreg;
  2329. end
  2330. else
  2331. ref.base:=tmpreg;
  2332. ref.offset:=0;
  2333. ref.symbol:=nil;
  2334. end;
  2335. procedure tbasecgarm.g_concatcopy_move(list : TAsmList;const source,dest : treference;len : tcgint);
  2336. var
  2337. paraloc1,paraloc2,paraloc3 : TCGPara;
  2338. pd : tprocdef;
  2339. begin
  2340. pd:=search_system_proc('MOVE');
  2341. paraloc1.init;
  2342. paraloc2.init;
  2343. paraloc3.init;
  2344. paramanager.getintparaloc(list,pd,1,paraloc1);
  2345. paramanager.getintparaloc(list,pd,2,paraloc2);
  2346. paramanager.getintparaloc(list,pd,3,paraloc3);
  2347. a_load_const_cgpara(list,OS_SINT,len,paraloc3);
  2348. a_loadaddr_ref_cgpara(list,dest,paraloc2);
  2349. a_loadaddr_ref_cgpara(list,source,paraloc1);
  2350. paramanager.freecgpara(list,paraloc3);
  2351. paramanager.freecgpara(list,paraloc2);
  2352. paramanager.freecgpara(list,paraloc1);
  2353. alloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2354. alloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2355. a_call_name(list,'FPC_MOVE',false);
  2356. dealloccpuregisters(list,R_FPUREGISTER,paramanager.get_volatile_registers_fpu(pocall_default));
  2357. dealloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
  2358. paraloc3.done;
  2359. paraloc2.done;
  2360. paraloc1.done;
  2361. end;
  2362. procedure tbasecgarm.g_concatcopy_internal(list : TAsmList;const source,dest : treference;len : tcgint;aligned : boolean);
  2363. const
  2364. maxtmpreg_arm = 10; {roozbeh: can be reduced to 8 or lower if might conflick with reserved ones,also +2 is used becouse of regs required for referencing}
  2365. maxtmpreg_thumb = 5;
  2366. var
  2367. srcref,dstref,usedtmpref,usedtmpref2:treference;
  2368. srcreg,destreg,countreg,r,tmpreg:tregister;
  2369. helpsize:aint;
  2370. copysize:byte;
  2371. cgsize:Tcgsize;
  2372. tmpregisters:array[1..maxtmpreg_arm] of tregister;
  2373. maxtmpreg,
  2374. tmpregi,tmpregi2:byte;
  2375. { will never be called with count<=4 }
  2376. procedure genloop(count : aword;size : byte);
  2377. const
  2378. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2379. var
  2380. l : tasmlabel;
  2381. begin
  2382. current_asmdata.getjumplabel(l);
  2383. if count<size then size:=1;
  2384. a_load_const_reg(list,OS_INT,count div size,countreg);
  2385. cg.a_label(list,l);
  2386. srcref.addressmode:=AM_POSTINDEXED;
  2387. dstref.addressmode:=AM_POSTINDEXED;
  2388. srcref.offset:=size;
  2389. dstref.offset:=size;
  2390. r:=getintregister(list,size2opsize[size]);
  2391. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2392. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2393. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1),PF_S));
  2394. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2395. a_jmp_flags(list,F_NE,l);
  2396. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2397. srcref.offset:=1;
  2398. dstref.offset:=1;
  2399. case count mod size of
  2400. 1:
  2401. begin
  2402. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2403. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2404. end;
  2405. 2:
  2406. if aligned then
  2407. begin
  2408. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2409. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2410. end
  2411. else
  2412. begin
  2413. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2414. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2415. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2416. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2417. end;
  2418. 3:
  2419. if aligned then
  2420. begin
  2421. srcref.offset:=2;
  2422. dstref.offset:=2;
  2423. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2424. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2425. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2426. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2427. end
  2428. else
  2429. begin
  2430. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2431. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2432. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2433. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2434. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2435. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2436. end;
  2437. end;
  2438. { keep the registers alive }
  2439. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2440. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2441. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2442. end;
  2443. { will never be called with count<=4 }
  2444. procedure genloop_thumb(count : aword;size : byte);
  2445. procedure refincofs(const ref : treference;const value : longint = 1);
  2446. begin
  2447. a_op_const_reg(list,OP_ADD,OS_ADDR,value,ref.base);
  2448. end;
  2449. const
  2450. size2opsize : array[1..4] of tcgsize = (OS_8,OS_16,OS_NO,OS_32);
  2451. var
  2452. l : tasmlabel;
  2453. begin
  2454. current_asmdata.getjumplabel(l);
  2455. if count<size then size:=1;
  2456. a_load_const_reg(list,OS_INT,count div size,countreg);
  2457. cg.a_label(list,l);
  2458. r:=getintregister(list,size2opsize[size]);
  2459. a_load_ref_reg(list,size2opsize[size],size2opsize[size],srcref,r);
  2460. refincofs(srcref);
  2461. a_load_reg_ref(list,size2opsize[size],size2opsize[size],r,dstref);
  2462. refincofs(dstref);
  2463. a_reg_alloc(list,NR_DEFAULTFLAGS);
  2464. list.concat(taicpu.op_reg_reg_const(A_SUB,countreg,countreg,1));
  2465. a_jmp_flags(list,F_NE,l);
  2466. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2467. case count mod size of
  2468. 1:
  2469. begin
  2470. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2471. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2472. end;
  2473. 2:
  2474. if aligned then
  2475. begin
  2476. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2477. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2478. end
  2479. else
  2480. begin
  2481. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2482. refincofs(srcref);
  2483. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2484. refincofs(dstref);
  2485. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2486. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2487. end;
  2488. 3:
  2489. if aligned then
  2490. begin
  2491. a_load_ref_reg(list,OS_16,OS_16,srcref,r);
  2492. refincofs(srcref,2);
  2493. a_load_reg_ref(list,OS_16,OS_16,r,dstref);
  2494. refincofs(dstref,2);
  2495. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2496. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2497. end
  2498. else
  2499. begin
  2500. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2501. refincofs(srcref);
  2502. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2503. refincofs(dstref);
  2504. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2505. refincofs(srcref);
  2506. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2507. refincofs(dstref);
  2508. a_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2509. a_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2510. end;
  2511. end;
  2512. { keep the registers alive }
  2513. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  2514. list.concat(taicpu.op_reg_reg(A_MOV,srcreg,srcreg));
  2515. list.concat(taicpu.op_reg_reg(A_MOV,destreg,destreg));
  2516. end;
  2517. begin
  2518. if len=0 then
  2519. exit;
  2520. if GenerateThumbCode then
  2521. maxtmpreg:=maxtmpreg_thumb
  2522. else
  2523. maxtmpreg:=maxtmpreg_arm;
  2524. helpsize:=12+maxtmpreg*4;//52 with maxtmpreg=10
  2525. dstref:=dest;
  2526. srcref:=source;
  2527. if cs_opt_size in current_settings.optimizerswitches then
  2528. helpsize:=8;
  2529. if aligned and (len=4) then
  2530. begin
  2531. tmpreg:=getintregister(list,OS_32);
  2532. a_load_ref_reg(list,OS_32,OS_32,source,tmpreg);
  2533. a_load_reg_ref(list,OS_32,OS_32,tmpreg,dest);
  2534. end
  2535. else if aligned and (len=2) then
  2536. begin
  2537. tmpreg:=getintregister(list,OS_16);
  2538. a_load_ref_reg(list,OS_16,OS_16,source,tmpreg);
  2539. a_load_reg_ref(list,OS_16,OS_16,tmpreg,dest);
  2540. end
  2541. else if (len<=helpsize) and aligned then
  2542. begin
  2543. tmpregi:=0;
  2544. srcreg:=getintregister(list,OS_ADDR);
  2545. { explicit pc relative addressing, could be
  2546. e.g. a floating point constant }
  2547. if source.base=NR_PC then
  2548. begin
  2549. { ... then we don't need a loadaddr }
  2550. srcref:=source;
  2551. end
  2552. else
  2553. begin
  2554. a_loadaddr_ref_reg(list,source,srcreg);
  2555. reference_reset_base(srcref,srcreg,0,source.alignment);
  2556. end;
  2557. while (len div 4 <> 0) and (tmpregi<maxtmpreg) do
  2558. begin
  2559. inc(tmpregi);
  2560. tmpregisters[tmpregi]:=getintregister(list,OS_32);
  2561. a_load_ref_reg(list,OS_32,OS_32,srcref,tmpregisters[tmpregi]);
  2562. inc(srcref.offset,4);
  2563. dec(len,4);
  2564. end;
  2565. destreg:=getintregister(list,OS_ADDR);
  2566. a_loadaddr_ref_reg(list,dest,destreg);
  2567. reference_reset_base(dstref,destreg,0,dest.alignment);
  2568. tmpregi2:=1;
  2569. while (tmpregi2<=tmpregi) do
  2570. begin
  2571. a_load_reg_ref(list,OS_32,OS_32,tmpregisters[tmpregi2],dstref);
  2572. inc(dstref.offset,4);
  2573. inc(tmpregi2);
  2574. end;
  2575. copysize:=4;
  2576. cgsize:=OS_32;
  2577. while len<>0 do
  2578. begin
  2579. if len<2 then
  2580. begin
  2581. copysize:=1;
  2582. cgsize:=OS_8;
  2583. end
  2584. else if len<4 then
  2585. begin
  2586. copysize:=2;
  2587. cgsize:=OS_16;
  2588. end;
  2589. dec(len,copysize);
  2590. r:=getintregister(list,cgsize);
  2591. a_load_ref_reg(list,cgsize,cgsize,srcref,r);
  2592. a_load_reg_ref(list,cgsize,cgsize,r,dstref);
  2593. inc(srcref.offset,copysize);
  2594. inc(dstref.offset,copysize);
  2595. end;{end of while}
  2596. end
  2597. else
  2598. begin
  2599. cgsize:=OS_32;
  2600. if (len<=4) then{len<=4 and not aligned}
  2601. begin
  2602. r:=getintregister(list,cgsize);
  2603. usedtmpref:=a_internal_load_ref_reg(list,OS_8,OS_8,srcref,r);
  2604. if Len=1 then
  2605. a_load_reg_ref(list,OS_8,OS_8,r,dstref)
  2606. else
  2607. begin
  2608. tmpreg:=getintregister(list,cgsize);
  2609. usedtmpref2:=a_internal_load_reg_ref(list,OS_8,OS_8,r,dstref);
  2610. inc(usedtmpref.offset,1);
  2611. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2612. inc(usedtmpref2.offset,1);
  2613. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2614. if len>2 then
  2615. begin
  2616. inc(usedtmpref.offset,1);
  2617. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2618. inc(usedtmpref2.offset,1);
  2619. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2620. if len>3 then
  2621. begin
  2622. inc(usedtmpref.offset,1);
  2623. a_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  2624. inc(usedtmpref2.offset,1);
  2625. a_load_reg_ref(list,OS_8,OS_8,tmpreg,usedtmpref2);
  2626. end;
  2627. end;
  2628. end;
  2629. end{end of if len<=4}
  2630. else
  2631. begin{unaligned & 4<len<helpsize **or** aligned/unaligned & len>helpsize}
  2632. destreg:=getintregister(list,OS_ADDR);
  2633. a_loadaddr_ref_reg(list,dest,destreg);
  2634. reference_reset_base(dstref,destreg,0,dest.alignment);
  2635. srcreg:=getintregister(list,OS_ADDR);
  2636. a_loadaddr_ref_reg(list,source,srcreg);
  2637. reference_reset_base(srcref,srcreg,0,source.alignment);
  2638. countreg:=getintregister(list,OS_32);
  2639. // if cs_opt_size in current_settings.optimizerswitches then
  2640. { roozbeh : it seems loading 1 byte is faster becouse of caching/fetching(?) }
  2641. {if aligned then
  2642. genloop(len,4)
  2643. else}
  2644. if GenerateThumbCode then
  2645. genloop_thumb(len,1)
  2646. else
  2647. genloop(len,1);
  2648. end;
  2649. end;
  2650. end;
  2651. procedure tbasecgarm.g_concatcopy_unaligned(list : TAsmList;const source,dest : treference;len : tcgint);
  2652. begin
  2653. g_concatcopy_internal(list,source,dest,len,false);
  2654. end;
  2655. procedure tbasecgarm.g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);
  2656. begin
  2657. if (source.alignment in [1,3]) or
  2658. (dest.alignment in [1,3]) then
  2659. g_concatcopy_internal(list,source,dest,len,false)
  2660. else
  2661. g_concatcopy_internal(list,source,dest,len,true);
  2662. end;
  2663. procedure tbasecgarm.g_overflowCheck(list : TAsmList;const l : tlocation;def : tdef);
  2664. var
  2665. ovloc : tlocation;
  2666. begin
  2667. ovloc.loc:=LOC_VOID;
  2668. g_overflowCheck_loc(list,l,def,ovloc);
  2669. end;
  2670. procedure tbasecgarm.g_overflowCheck_loc(List:TAsmList;const Loc:TLocation;def:TDef;ovloc : tlocation);
  2671. var
  2672. hl : tasmlabel;
  2673. ai:TAiCpu;
  2674. hflags : tresflags;
  2675. begin
  2676. if not(cs_check_overflow in current_settings.localswitches) then
  2677. exit;
  2678. current_asmdata.getjumplabel(hl);
  2679. case ovloc.loc of
  2680. LOC_VOID:
  2681. begin
  2682. ai:=taicpu.op_sym(A_B,hl);
  2683. ai.is_jmp:=true;
  2684. if not((def.typ=pointerdef) or
  2685. ((def.typ=orddef) and
  2686. (torddef(def).ordtype in [u64bit,u16bit,u32bit,u8bit,uchar,
  2687. pasbool8,pasbool16,pasbool32,pasbool64]))) then
  2688. ai.SetCondition(C_VC)
  2689. else
  2690. if TAiCpu(List.Last).opcode in [A_RSB,A_RSC,A_SBC,A_SUB] then
  2691. ai.SetCondition(C_CS)
  2692. else
  2693. ai.SetCondition(C_CC);
  2694. list.concat(ai);
  2695. end;
  2696. LOC_FLAGS:
  2697. begin
  2698. hflags:=ovloc.resflags;
  2699. inverse_flags(hflags);
  2700. cg.a_jmp_flags(list,hflags,hl);
  2701. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2702. end;
  2703. else
  2704. internalerror(200409281);
  2705. end;
  2706. a_call_name(list,'FPC_OVERFLOW',false);
  2707. a_label(list,hl);
  2708. end;
  2709. procedure tbasecgarm.g_save_registers(list : TAsmList);
  2710. begin
  2711. { this work is done in g_proc_entry }
  2712. end;
  2713. procedure tbasecgarm.g_restore_registers(list : TAsmList);
  2714. begin
  2715. { this work is done in g_proc_exit }
  2716. end;
  2717. procedure tbasecgarm.a_jmp_cond(list : TAsmList;cond : TOpCmp;l: tasmlabel);
  2718. var
  2719. ai : taicpu;
  2720. hlabel : TAsmLabel;
  2721. begin
  2722. if GenerateThumbCode then
  2723. begin
  2724. { the optimizer has to fix this if jump range is sufficient short }
  2725. current_asmdata.getjumplabel(hlabel);
  2726. ai:=Taicpu.Op_sym(A_B,hlabel);
  2727. ai.SetCondition(inverse_cond(OpCmp2AsmCond[cond]));
  2728. ai.is_jmp:=true;
  2729. list.concat(ai);
  2730. a_jmp_always(list,l);
  2731. a_label(list,hlabel);
  2732. end
  2733. else
  2734. begin
  2735. ai:=Taicpu.Op_sym(A_B,l);
  2736. ai.SetCondition(OpCmp2AsmCond[cond]);
  2737. ai.is_jmp:=true;
  2738. list.concat(ai);
  2739. end;
  2740. end;
  2741. function get_scalar_mm_op(fromsize,tosize : tcgsize) : tasmop;
  2742. const
  2743. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of tasmop = (
  2744. (A_VMOV,A_VCVT,A_NONE,A_NONE,A_NONE),
  2745. (A_VCVT,A_VMOV,A_NONE,A_NONE,A_NONE),
  2746. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2747. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE),
  2748. (A_NONE,A_NONE,A_NONE,A_NONE,A_NONE));
  2749. begin
  2750. result:=convertop[fromsize,tosize];
  2751. if result=A_NONE then
  2752. internalerror(200312205);
  2753. end;
  2754. function get_scalar_mm_prefix(fromsize,tosize : tcgsize) : TOpPostfix;
  2755. const
  2756. convertop : array[OS_F32..OS_F128,OS_F32..OS_F128] of TOpPostfix = (
  2757. (PF_F32, PF_F32F64,PF_None,PF_None,PF_None),
  2758. (PF_F64F32,PF_F64, PF_None,PF_None,PF_None),
  2759. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2760. (PF_None, PF_None, PF_None,PF_None,PF_None),
  2761. (PF_None, PF_None, PF_None,PF_None,PF_None));
  2762. begin
  2763. result:=convertop[fromsize,tosize];
  2764. end;
  2765. procedure tbasecgarm.a_loadmm_reg_reg(list: tasmlist; fromsize,tosize: tcgsize; reg1,reg2: tregister; shuffle: pmmshuffle);
  2766. var
  2767. instr: taicpu;
  2768. begin
  2769. if (shuffle=nil) or shufflescalar(shuffle) then
  2770. instr:=setoppostfix(taicpu.op_reg_reg(get_scalar_mm_op(tosize,fromsize),reg2,reg1),get_scalar_mm_prefix(tosize,fromsize))
  2771. else
  2772. internalerror(2009112407);
  2773. list.concat(instr);
  2774. case instr.opcode of
  2775. A_VMOV:
  2776. add_move_instruction(instr);
  2777. end;
  2778. end;
  2779. procedure tbasecgarm.a_loadmm_ref_reg(list: tasmlist; fromsize,tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  2780. var
  2781. intreg,
  2782. tmpmmreg : tregister;
  2783. reg64 : tregister64;
  2784. begin
  2785. if assigned(shuffle) and
  2786. not(shufflescalar(shuffle)) then
  2787. internalerror(2009112413);
  2788. case fromsize of
  2789. OS_32,OS_S32:
  2790. begin
  2791. fromsize:=OS_F32;
  2792. { since we are loading an integer, no conversion may be required }
  2793. if (fromsize<>tosize) then
  2794. internalerror(2009112801);
  2795. end;
  2796. OS_64,OS_S64:
  2797. begin
  2798. fromsize:=OS_F64;
  2799. { since we are loading an integer, no conversion may be required }
  2800. if (fromsize<>tosize) then
  2801. internalerror(2009112901);
  2802. end;
  2803. end;
  2804. if (fromsize<>tosize) then
  2805. tmpmmreg:=getmmregister(list,fromsize)
  2806. else
  2807. tmpmmreg:=reg;
  2808. if (ref.alignment in [1,2]) then
  2809. begin
  2810. case fromsize of
  2811. OS_F32:
  2812. begin
  2813. intreg:=getintregister(list,OS_32);
  2814. a_load_ref_reg(list,OS_32,OS_32,ref,intreg);
  2815. a_loadmm_intreg_reg(list,OS_32,OS_F32,intreg,tmpmmreg,mms_movescalar);
  2816. end;
  2817. OS_F64:
  2818. begin
  2819. reg64.reglo:=getintregister(list,OS_32);
  2820. reg64.reghi:=getintregister(list,OS_32);
  2821. cg64.a_load64_ref_reg(list,ref,reg64);
  2822. cg64.a_loadmm_intreg64_reg(list,OS_F64,reg64,tmpmmreg);
  2823. end;
  2824. else
  2825. internalerror(2009112412);
  2826. end;
  2827. end
  2828. else
  2829. begin
  2830. handle_load_store(list,A_VLDR,PF_None,tmpmmreg,ref);
  2831. end;
  2832. if (tmpmmreg<>reg) then
  2833. a_loadmm_reg_reg(list,fromsize,tosize,tmpmmreg,reg,shuffle);
  2834. end;
  2835. procedure tbasecgarm.a_loadmm_reg_ref(list: tasmlist; fromsize,tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  2836. var
  2837. intreg,
  2838. tmpmmreg : tregister;
  2839. reg64 : tregister64;
  2840. begin
  2841. if assigned(shuffle) and
  2842. not(shufflescalar(shuffle)) then
  2843. internalerror(2009112416);
  2844. case tosize of
  2845. OS_32,OS_S32:
  2846. begin
  2847. tosize:=OS_F32;
  2848. { since we are loading an integer, no conversion may be required }
  2849. if (fromsize<>tosize) then
  2850. internalerror(2009112801);
  2851. end;
  2852. OS_64,OS_S64:
  2853. begin
  2854. tosize:=OS_F64;
  2855. { since we are loading an integer, no conversion may be required }
  2856. if (fromsize<>tosize) then
  2857. internalerror(2009112901);
  2858. end;
  2859. end;
  2860. if (fromsize<>tosize) then
  2861. begin
  2862. tmpmmreg:=getmmregister(list,tosize);
  2863. a_loadmm_reg_reg(list,fromsize,tosize,reg,tmpmmreg,shuffle);
  2864. end
  2865. else
  2866. tmpmmreg:=reg;
  2867. if (ref.alignment in [1,2]) then
  2868. begin
  2869. case tosize of
  2870. OS_F32:
  2871. begin
  2872. intreg:=getintregister(list,OS_32);
  2873. a_loadmm_reg_intreg(list,OS_F32,OS_32,tmpmmreg,intreg,shuffle);
  2874. a_load_reg_ref(list,OS_32,OS_32,intreg,ref);
  2875. end;
  2876. OS_F64:
  2877. begin
  2878. reg64.reglo:=getintregister(list,OS_32);
  2879. reg64.reghi:=getintregister(list,OS_32);
  2880. cg64.a_loadmm_reg_intreg64(list,OS_F64,tmpmmreg,reg64);
  2881. cg64.a_load64_reg_ref(list,reg64,ref);
  2882. end;
  2883. else
  2884. internalerror(2009112417);
  2885. end;
  2886. end
  2887. else
  2888. begin
  2889. handle_load_store(list,A_VSTR,PF_None,tmpmmreg,ref);
  2890. end;
  2891. end;
  2892. procedure tbasecgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize : tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  2893. begin
  2894. { this code can only be used to transfer raw data, not to perform
  2895. conversions }
  2896. if (tosize<>OS_F32) then
  2897. internalerror(2009112419);
  2898. if not(fromsize in [OS_32,OS_S32]) then
  2899. internalerror(2009112420);
  2900. if assigned(shuffle) and
  2901. not shufflescalar(shuffle) then
  2902. internalerror(2009112516);
  2903. list.concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg));
  2904. end;
  2905. procedure tbasecgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize : tcgsize; mmreg, intreg: tregister;shuffle : pmmshuffle);
  2906. begin
  2907. { this code can only be used to transfer raw data, not to perform
  2908. conversions }
  2909. if (fromsize<>OS_F32) then
  2910. internalerror(2009112430);
  2911. if not(tosize in [OS_32,OS_S32]) then
  2912. internalerror(2009112420);
  2913. if assigned(shuffle) and
  2914. not shufflescalar(shuffle) then
  2915. internalerror(2009112514);
  2916. list.concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg));
  2917. end;
  2918. procedure tbasecgarm.a_opmm_reg_reg(list: tasmlist; op: topcg; size: tcgsize; src, dst: tregister; shuffle: pmmshuffle);
  2919. var
  2920. tmpreg: tregister;
  2921. begin
  2922. { the vfp doesn't support xor nor any other logical operation, but
  2923. this routine is used to initialise global mm regvars. We can
  2924. easily initialise an mm reg with 0 though. }
  2925. case op of
  2926. OP_XOR:
  2927. begin
  2928. if (src<>dst) or
  2929. (reg_cgsize(src)<>size) or
  2930. assigned(shuffle) then
  2931. internalerror(2009112907);
  2932. tmpreg:=getintregister(list,OS_32);
  2933. a_load_const_reg(list,OS_32,0,tmpreg);
  2934. case size of
  2935. OS_F32:
  2936. list.concat(taicpu.op_reg_reg(A_VMOV,dst,tmpreg));
  2937. OS_F64:
  2938. list.concat(taicpu.op_reg_reg_reg(A_VMOV,dst,tmpreg,tmpreg));
  2939. else
  2940. internalerror(2009112908);
  2941. end;
  2942. end
  2943. else
  2944. internalerror(2009112906);
  2945. end;
  2946. end;
  2947. procedure tbasecgarm.maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  2948. const
  2949. overflowops = [OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NEG];
  2950. begin
  2951. if (op in overflowops) and
  2952. (size in [OS_8,OS_S8,OS_16,OS_S16]) then
  2953. a_load_reg_reg(list,OS_32,size,dst,dst);
  2954. end;
  2955. procedure tbasecgarm.safe_mla(list : TAsmList; op1,op2,op3,op4 : TRegister);
  2956. procedure checkreg(var reg : TRegister);
  2957. var
  2958. tmpreg : TRegister;
  2959. begin
  2960. if ((GenerateThumbCode or GenerateThumb2Code) and (getsupreg(reg)=RS_R13)) or
  2961. (getsupreg(reg)=RS_R15) then
  2962. begin
  2963. tmpreg:=getintregister(list,OS_INT);
  2964. a_load_reg_reg(list,OS_INT,OS_INT,reg,tmpreg);
  2965. reg:=tmpreg;
  2966. end;
  2967. end;
  2968. begin
  2969. checkreg(op1);
  2970. checkreg(op2);
  2971. checkreg(op3);
  2972. checkreg(op4);
  2973. list.concat(taicpu.op_reg_reg_reg_reg(A_MLA,op1,op2,op3,op4));
  2974. end;
  2975. procedure tcg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  2976. begin
  2977. case op of
  2978. OP_NEG:
  2979. begin
  2980. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  2981. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  2982. list.concat(taicpu.op_reg_reg_const(A_RSC,regdst.reghi,regsrc.reghi,0));
  2983. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  2984. end;
  2985. OP_NOT:
  2986. begin
  2987. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  2988. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  2989. end;
  2990. else
  2991. a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);
  2992. end;
  2993. end;
  2994. procedure tcg64farm.a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);
  2995. begin
  2996. a_op64_const_reg_reg(list,op,size,value,reg,reg);
  2997. end;
  2998. procedure tcg64farm.a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);
  2999. var
  3000. ovloc : tlocation;
  3001. begin
  3002. a_op64_const_reg_reg_checkoverflow(list,op,size,value,regsrc,regdst,false,ovloc);
  3003. end;
  3004. procedure tcg64farm.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);
  3005. var
  3006. ovloc : tlocation;
  3007. begin
  3008. a_op64_reg_reg_reg_checkoverflow(list,op,size,regsrc1,regsrc2,regdst,false,ovloc);
  3009. end;
  3010. procedure tcg64farm.a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);
  3011. begin
  3012. { this code can only be used to transfer raw data, not to perform
  3013. conversions }
  3014. if (mmsize<>OS_F64) then
  3015. internalerror(2009112405);
  3016. list.concat(taicpu.op_reg_reg_reg(A_VMOV,mmreg,intreg.reglo,intreg.reghi));
  3017. end;
  3018. procedure tcg64farm.a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);
  3019. begin
  3020. { this code can only be used to transfer raw data, not to perform
  3021. conversions }
  3022. if (mmsize<>OS_F64) then
  3023. internalerror(2009112406);
  3024. list.concat(taicpu.op_reg_reg_reg(A_VMOV,intreg.reglo,intreg.reghi,mmreg));
  3025. end;
  3026. procedure tcg64farm.a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3027. var
  3028. tmpreg : tregister;
  3029. b : byte;
  3030. begin
  3031. ovloc.loc:=LOC_VOID;
  3032. case op of
  3033. OP_NEG,
  3034. OP_NOT :
  3035. internalerror(2012022501);
  3036. end;
  3037. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3038. begin
  3039. case op of
  3040. OP_ADD:
  3041. begin
  3042. if is_shifter_const(lo(value),b) then
  3043. begin
  3044. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3045. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3046. end
  3047. else
  3048. begin
  3049. tmpreg:=cg.getintregister(list,OS_32);
  3050. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3051. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3052. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3053. end;
  3054. if is_shifter_const(hi(value),b) then
  3055. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,hi(value)),PF_S))
  3056. else
  3057. begin
  3058. tmpreg:=cg.getintregister(list,OS_32);
  3059. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3060. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3061. end;
  3062. end;
  3063. OP_SUB:
  3064. begin
  3065. if is_shifter_const(lo(value),b) then
  3066. begin
  3067. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3068. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,lo(value)),PF_S))
  3069. end
  3070. else
  3071. begin
  3072. tmpreg:=cg.getintregister(list,OS_32);
  3073. cg.a_load_const_reg(list,OS_32,lo(value),tmpreg);
  3074. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3075. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3076. end;
  3077. if is_shifter_const(hi(value),b) then
  3078. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))),PF_S))
  3079. else
  3080. begin
  3081. tmpreg:=cg.getintregister(list,OS_32);
  3082. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3083. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg),PF_S));
  3084. end;
  3085. end;
  3086. else
  3087. internalerror(200502131);
  3088. end;
  3089. if size=OS_64 then
  3090. begin
  3091. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3092. ovloc.loc:=LOC_FLAGS;
  3093. case op of
  3094. OP_ADD:
  3095. ovloc.resflags:=F_CS;
  3096. OP_SUB:
  3097. ovloc.resflags:=F_CC;
  3098. end;
  3099. end;
  3100. end
  3101. else
  3102. begin
  3103. case op of
  3104. OP_AND,OP_OR,OP_XOR:
  3105. begin
  3106. cg.a_op_const_reg_reg(list,op,OS_32,aint(lo(value)),regsrc.reglo,regdst.reglo);
  3107. cg.a_op_const_reg_reg(list,op,OS_32,aint(hi(value)),regsrc.reghi,regdst.reghi);
  3108. end;
  3109. OP_ADD:
  3110. begin
  3111. if is_shifter_const(aint(lo(value)),b) then
  3112. begin
  3113. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3114. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_ADD,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3115. end
  3116. else
  3117. begin
  3118. tmpreg:=cg.getintregister(list,OS_32);
  3119. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3120. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3121. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3122. end;
  3123. if is_shifter_const(aint(hi(value)),b) then
  3124. list.concat(taicpu.op_reg_reg_const(A_ADC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3125. else
  3126. begin
  3127. tmpreg:=cg.getintregister(list,OS_32);
  3128. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  3129. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc.reghi,tmpreg));
  3130. end;
  3131. end;
  3132. OP_SUB:
  3133. begin
  3134. if is_shifter_const(aint(lo(value)),b) then
  3135. begin
  3136. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3137. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_SUB,regdst.reglo,regsrc.reglo,aint(lo(value))),PF_S))
  3138. end
  3139. else
  3140. begin
  3141. tmpreg:=cg.getintregister(list,OS_32);
  3142. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  3143. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3144. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc.reglo,tmpreg),PF_S));
  3145. end;
  3146. if is_shifter_const(aint(hi(value)),b) then
  3147. list.concat(taicpu.op_reg_reg_const(A_SBC,regdst.reghi,regsrc.reghi,aint(hi(value))))
  3148. else
  3149. begin
  3150. tmpreg:=cg.getintregister(list,OS_32);
  3151. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  3152. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc.reghi,tmpreg));
  3153. end;
  3154. end;
  3155. else
  3156. internalerror(2003083101);
  3157. end;
  3158. end;
  3159. end;
  3160. procedure tcg64farm.a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);
  3161. begin
  3162. ovloc.loc:=LOC_VOID;
  3163. case op of
  3164. OP_NEG,
  3165. OP_NOT :
  3166. internalerror(2012022502);
  3167. end;
  3168. if (setflags or tbasecgarm(cg).cgsetflags) and (op in [OP_ADD,OP_SUB]) then
  3169. begin
  3170. case op of
  3171. OP_ADD:
  3172. begin
  3173. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3174. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3175. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi),PF_S));
  3176. end;
  3177. OP_SUB:
  3178. begin
  3179. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3180. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3181. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi),PF_S));
  3182. end;
  3183. else
  3184. internalerror(2003083101);
  3185. end;
  3186. if size=OS_64 then
  3187. begin
  3188. { the arm has an weired opinion how flags for SUB/ADD are handled }
  3189. ovloc.loc:=LOC_FLAGS;
  3190. case op of
  3191. OP_ADD:
  3192. ovloc.resflags:=F_CS;
  3193. OP_SUB:
  3194. ovloc.resflags:=F_CC;
  3195. end;
  3196. end;
  3197. end
  3198. else
  3199. begin
  3200. case op of
  3201. OP_AND,OP_OR,OP_XOR:
  3202. begin
  3203. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);
  3204. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);
  3205. end;
  3206. OP_ADD:
  3207. begin
  3208. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3209. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_ADD,regdst.reglo,regsrc1.reglo,regsrc2.reglo),PF_S));
  3210. list.concat(taicpu.op_reg_reg_reg(A_ADC,regdst.reghi,regsrc1.reghi,regsrc2.reghi));
  3211. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3212. end;
  3213. OP_SUB:
  3214. begin
  3215. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  3216. list.concat(setoppostfix(taicpu.op_reg_reg_reg(A_SUB,regdst.reglo,regsrc2.reglo,regsrc1.reglo),PF_S));
  3217. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,regsrc2.reghi,regsrc1.reghi));
  3218. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3219. end;
  3220. else
  3221. internalerror(2003083101);
  3222. end;
  3223. end;
  3224. end;
  3225. procedure tthumbcgarm.init_register_allocators;
  3226. begin
  3227. inherited init_register_allocators;
  3228. if assigned(current_procinfo) and (current_procinfo.framepointer=NR_R7) then
  3229. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3230. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6],first_int_imreg,[])
  3231. else
  3232. rg[R_INTREGISTER]:=trgintcputhumb.create(R_INTREGISTER,R_SUBWHOLE,
  3233. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7],first_int_imreg,[]);
  3234. end;
  3235. procedure tthumbcgarm.done_register_allocators;
  3236. begin
  3237. rg[R_INTREGISTER].free;
  3238. rg[R_FPUREGISTER].free;
  3239. rg[R_MMREGISTER].free;
  3240. inherited done_register_allocators;
  3241. end;
  3242. procedure tthumbcgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  3243. var
  3244. ref : treference;
  3245. shift : byte;
  3246. r : byte;
  3247. regs, saveregs : tcpuregisterset;
  3248. r7offset,
  3249. stackmisalignment : pint;
  3250. postfix: toppostfix;
  3251. registerarea,
  3252. imm1, imm2: DWord;
  3253. stack_parameters: Boolean;
  3254. begin
  3255. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3256. LocalSize:=align(LocalSize,4);
  3257. { call instruction does not put anything on the stack }
  3258. stackmisalignment:=0;
  3259. if not(nostackframe) then
  3260. begin
  3261. a_reg_alloc(list,NR_STACK_POINTER_REG);
  3262. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3263. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  3264. { save int registers }
  3265. reference_reset(ref,4);
  3266. ref.index:=NR_STACK_POINTER_REG;
  3267. ref.addressmode:=AM_PREINDEXED;
  3268. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3269. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3270. begin
  3271. //!!!! a_reg_alloc(list,NR_R12);
  3272. //!!!! list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  3273. end;
  3274. { the (old) ARM APCS requires saving both the stack pointer (to
  3275. crawl the stack) and the PC (to identify the function this
  3276. stack frame belongs to) -> also save R12 (= copy of R13 on entry)
  3277. and R15 -- still needs updating for EABI and Darwin, they don't
  3278. need that }
  3279. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3280. regs:=regs+[RS_R7,RS_R14]
  3281. else
  3282. // if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  3283. include(regs,RS_R14);
  3284. { safely estimate stack size }
  3285. if localsize+current_settings.alignment.localalignmax+4>508 then
  3286. begin
  3287. include(rg[R_INTREGISTER].used_in_proc,RS_R4);
  3288. include(regs,RS_R4);
  3289. end;
  3290. registerarea:=0;
  3291. if regs<>[] then
  3292. begin
  3293. for r:=RS_R0 to RS_R15 do
  3294. if r in regs then
  3295. inc(registerarea,4);
  3296. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,regs));
  3297. end;
  3298. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3299. if stack_parameters or (LocalSize<>0) or
  3300. ((stackmisalignment<>0) and
  3301. ((pi_do_call in current_procinfo.flags) or
  3302. (po_assembler in current_procinfo.procdef.procoptions))) then
  3303. begin
  3304. { do we access stack parameters?
  3305. if yes, the previously estimated stacksize must be used }
  3306. if stack_parameters then
  3307. begin
  3308. if localsize>tarmprocinfo(current_procinfo).stackframesize then
  3309. begin
  3310. writeln(localsize);
  3311. writeln(tarmprocinfo(current_procinfo).stackframesize);
  3312. internalerror(2013040601);
  3313. end
  3314. else
  3315. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea;
  3316. end
  3317. else
  3318. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3319. if localsize<508 then
  3320. begin
  3321. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  3322. end
  3323. else if localsize<=1016 then
  3324. begin
  3325. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3326. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize-508));
  3327. end
  3328. else
  3329. begin
  3330. a_load_const_reg(list,OS_ADDR,-localsize,NR_R4);
  3331. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R4));
  3332. include(regs,RS_R4);
  3333. //!!!! if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  3334. //!!!! a_reg_alloc(list,NR_R12);
  3335. //!!!! a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  3336. //!!!! list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  3337. //!!!! a_reg_dealloc(list,NR_R12);
  3338. end;
  3339. end;
  3340. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3341. begin
  3342. list.concat(taicpu.op_reg_reg_const(A_ADD,current_procinfo.framepointer,NR_STACK_POINTER_REG,0));
  3343. end;
  3344. end;
  3345. end;
  3346. procedure tthumbcgarm.g_proc_exit(list: TAsmList; parasize: longint; nostackframe: boolean);
  3347. var
  3348. ref : treference;
  3349. LocalSize : longint;
  3350. r,
  3351. shift : byte;
  3352. saveregs,
  3353. regs : tcpuregisterset;
  3354. registerarea : DWord;
  3355. stackmisalignment: pint;
  3356. imm1, imm2: DWord;
  3357. stack_parameters : Boolean;
  3358. begin
  3359. if not(nostackframe) then
  3360. begin
  3361. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  3362. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  3363. include(regs,RS_R15);
  3364. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  3365. include(regs,getsupreg(current_procinfo.framepointer));
  3366. registerarea:=0;
  3367. for r:=RS_R0 to RS_R15 do
  3368. if r in regs then
  3369. inc(registerarea,4);
  3370. stackmisalignment:=registerarea mod current_settings.alignment.localalignmax;
  3371. LocalSize:=current_procinfo.calc_stackframe_size;
  3372. if stack_parameters then
  3373. localsize:=tarmprocinfo(current_procinfo).stackframesize-registerarea
  3374. else
  3375. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  3376. if (current_procinfo.framepointer=NR_STACK_POINTER_REG) or
  3377. (target_info.system in systems_darwin) then
  3378. begin
  3379. if (LocalSize<>0) or
  3380. ((stackmisalignment<>0) and
  3381. ((pi_do_call in current_procinfo.flags) or
  3382. (po_assembler in current_procinfo.procdef.procoptions))) then
  3383. begin
  3384. if LocalSize=0 then
  3385. else if LocalSize<=508 then
  3386. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize))
  3387. else if LocalSize<=1016 then
  3388. begin
  3389. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,508));
  3390. list.concat(taicpu.op_reg_reg_const(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,localsize-508));
  3391. end
  3392. else
  3393. begin
  3394. a_reg_alloc(list,NR_R3);
  3395. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R3);
  3396. list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R3));
  3397. a_reg_dealloc(list,NR_R3);
  3398. end;
  3399. end;
  3400. if regs=[] then
  3401. begin
  3402. if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3403. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3404. else
  3405. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3406. end
  3407. else
  3408. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,regs));
  3409. end;
  3410. end
  3411. else if not(CPUARM_HAS_BX in cpu_capabilities[current_settings.cputype]) then
  3412. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14))
  3413. else
  3414. list.concat(taicpu.op_reg(A_BX,NR_R14))
  3415. end;
  3416. procedure tthumbcgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3417. var
  3418. oppostfix:toppostfix;
  3419. usedtmpref: treference;
  3420. tmpreg,tmpreg2 : tregister;
  3421. dir : integer;
  3422. begin
  3423. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3424. FromSize := ToSize;
  3425. case FromSize of
  3426. { signed integer registers }
  3427. OS_8:
  3428. oppostfix:=PF_B;
  3429. OS_S8:
  3430. oppostfix:=PF_SB;
  3431. OS_16:
  3432. oppostfix:=PF_H;
  3433. OS_S16:
  3434. oppostfix:=PF_SH;
  3435. OS_32,
  3436. OS_S32:
  3437. oppostfix:=PF_None;
  3438. else
  3439. InternalError(200308298);
  3440. end;
  3441. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3442. begin
  3443. if target_info.endian=endian_big then
  3444. dir:=-1
  3445. else
  3446. dir:=1;
  3447. case FromSize of
  3448. OS_16,OS_S16:
  3449. begin
  3450. { only complicated references need an extra loadaddr }
  3451. if assigned(ref.symbol) or
  3452. (ref.index<>NR_NO) or
  3453. (ref.offset<-124) or
  3454. (ref.offset>124) or
  3455. { sometimes the compiler reused registers }
  3456. (reg=ref.index) or
  3457. (reg=ref.base) then
  3458. begin
  3459. tmpreg2:=getintregister(list,OS_INT);
  3460. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3461. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3462. end
  3463. else
  3464. usedtmpref:=ref;
  3465. if target_info.endian=endian_big then
  3466. inc(usedtmpref.offset,1);
  3467. tmpreg:=getintregister(list,OS_INT);
  3468. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3469. inc(usedtmpref.offset,dir);
  3470. if FromSize=OS_16 then
  3471. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3472. else
  3473. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3474. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3475. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3476. end;
  3477. OS_32,OS_S32:
  3478. begin
  3479. tmpreg:=getintregister(list,OS_INT);
  3480. { only complicated references need an extra loadaddr }
  3481. if assigned(ref.symbol) or
  3482. (ref.index<>NR_NO) or
  3483. (ref.offset<-124) or
  3484. (ref.offset>124) or
  3485. { sometimes the compiler reused registers }
  3486. (reg=ref.index) or
  3487. (reg=ref.base) then
  3488. begin
  3489. tmpreg2:=getintregister(list,OS_INT);
  3490. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3491. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3492. end
  3493. else
  3494. usedtmpref:=ref;
  3495. if ref.alignment=2 then
  3496. begin
  3497. if target_info.endian=endian_big then
  3498. inc(usedtmpref.offset,2);
  3499. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  3500. inc(usedtmpref.offset,dir*2);
  3501. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  3502. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3503. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3504. end
  3505. else
  3506. begin
  3507. if target_info.endian=endian_big then
  3508. inc(usedtmpref.offset,3);
  3509. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3510. inc(usedtmpref.offset,dir);
  3511. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3512. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,8));
  3513. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3514. inc(usedtmpref.offset,dir);
  3515. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3516. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,16));
  3517. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3518. inc(usedtmpref.offset,dir);
  3519. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  3520. list.concat(taicpu.op_reg_const(A_LSL,tmpreg,24));
  3521. list.concat(taicpu.op_reg_reg(A_ORR,reg,tmpreg));
  3522. end;
  3523. end
  3524. else
  3525. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3526. end;
  3527. end
  3528. else
  3529. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  3530. if (fromsize=OS_S8) and (tosize = OS_16) then
  3531. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  3532. end;
  3533. procedure tthumbcgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3534. var
  3535. imm_shift : byte;
  3536. l : tasmlabel;
  3537. hr : treference;
  3538. begin
  3539. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3540. internalerror(2002090902);
  3541. if is_thumb_imm(a) then
  3542. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3543. else
  3544. begin
  3545. reference_reset(hr,4);
  3546. current_asmdata.getjumplabel(l);
  3547. cg.a_label(current_procinfo.aktlocaldata,l);
  3548. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3549. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3550. hr.symbol:=l;
  3551. hr.base:=NR_PC;
  3552. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3553. end;
  3554. end;
  3555. procedure tthumbcgarm.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);
  3556. var
  3557. hsym : tsym;
  3558. href,
  3559. tmpref : treference;
  3560. paraloc : Pcgparalocation;
  3561. l : TAsmLabel;
  3562. begin
  3563. { calculate the parameter info for the procdef }
  3564. procdef.init_paraloc_info(callerside);
  3565. hsym:=tsym(procdef.parast.Find('self'));
  3566. if not(assigned(hsym) and
  3567. (hsym.typ=paravarsym)) then
  3568. internalerror(200305251);
  3569. paraloc:=tparavarsym(hsym).paraloc[callerside].location;
  3570. while paraloc<>nil do
  3571. with paraloc^ do
  3572. begin
  3573. case loc of
  3574. LOC_REGISTER:
  3575. begin
  3576. if is_thumb_imm(ioffset) then
  3577. a_op_const_reg(list,OP_SUB,size,ioffset,register)
  3578. else
  3579. begin
  3580. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3581. reference_reset(tmpref,4);
  3582. current_asmdata.getjumplabel(l);
  3583. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3584. cg.a_label(current_procinfo.aktlocaldata,l);
  3585. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3586. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3587. tmpref.symbol:=l;
  3588. tmpref.base:=NR_PC;
  3589. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3590. a_op_reg_reg(list,OP_SUB,size,NR_R4,register);
  3591. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3592. end;
  3593. end;
  3594. LOC_REFERENCE:
  3595. begin
  3596. { offset in the wrapper needs to be adjusted for the stored
  3597. return address }
  3598. reference_reset_base(href,reference.index,reference.offset+sizeof(aint),sizeof(pint));
  3599. if is_thumb_imm(ioffset) then
  3600. a_op_const_ref(list,OP_SUB,size,ioffset,href)
  3601. else
  3602. begin
  3603. list.concat(taicpu.op_regset(A_PUSH,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3604. reference_reset(tmpref,4);
  3605. current_asmdata.getjumplabel(l);
  3606. current_procinfo.aktlocaldata.Concat(tai_align.Create(4));
  3607. cg.a_label(current_procinfo.aktlocaldata,l);
  3608. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  3609. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ioffset));
  3610. tmpref.symbol:=l;
  3611. tmpref.base:=NR_PC;
  3612. list.concat(taicpu.op_reg_ref(A_LDR,NR_R4,tmpref));
  3613. a_op_reg_ref(list,OP_SUB,size,NR_R4,href);
  3614. list.concat(taicpu.op_regset(A_POP,R_INTREGISTER,R_SUBWHOLE,[RS_R4]));
  3615. end;
  3616. end
  3617. else
  3618. internalerror(200309189);
  3619. end;
  3620. paraloc:=next;
  3621. end;
  3622. end;
  3623. function tthumbcgarm.handle_load_store(list: TAsmList; op: tasmop; oppostfix: toppostfix; reg: tregister; ref: treference): treference;
  3624. var
  3625. href : treference;
  3626. tmpreg : TRegister;
  3627. begin
  3628. href:=ref;
  3629. if { LDR/STR limitations }
  3630. (
  3631. (((op=A_LDR) and (oppostfix=PF_None)) or
  3632. ((op=A_STR) and (oppostfix=PF_None))) and
  3633. (ref.base<>NR_STACK_POINTER_REG) and
  3634. (abs(ref.offset)>124)
  3635. ) or
  3636. { LDRB/STRB limitations }
  3637. (
  3638. (((op=A_LDR) and (oppostfix=PF_B)) or
  3639. ((op=A_LDRB) and (oppostfix=PF_None)) or
  3640. ((op=A_STR) and (oppostfix=PF_B)) or
  3641. ((op=A_STRB) and (oppostfix=PF_None))) and
  3642. ((ref.base=NR_STACK_POINTER_REG) or
  3643. (ref.index=NR_STACK_POINTER_REG) or
  3644. (abs(ref.offset)>31)
  3645. )
  3646. ) or
  3647. { LDRH/STRH limitations }
  3648. (
  3649. (((op=A_LDR) and (oppostfix=PF_H)) or
  3650. ((op=A_LDRH) and (oppostfix=PF_None)) or
  3651. ((op=A_STR) and (oppostfix=PF_H)) or
  3652. ((op=A_STRH) and (oppostfix=PF_None))) and
  3653. ((ref.base=NR_STACK_POINTER_REG) or
  3654. (ref.index=NR_STACK_POINTER_REG) or
  3655. (abs(ref.offset)>62) or
  3656. ((abs(ref.offset) mod 2)<>0)
  3657. )
  3658. ) then
  3659. begin
  3660. tmpreg:=getintregister(list,OS_ADDR);
  3661. a_loadaddr_ref_reg(list,ref,tmpreg);
  3662. reference_reset_base(href,tmpreg,0,ref.alignment);
  3663. end
  3664. else if (op=A_LDR) and
  3665. (oppostfix in [PF_None]) and
  3666. (ref.base=NR_STACK_POINTER_REG) and
  3667. (abs(ref.offset)>1020) then
  3668. begin
  3669. tmpreg:=getintregister(list,OS_ADDR);
  3670. a_loadaddr_ref_reg(list,ref,tmpreg);
  3671. reference_reset_base(href,tmpreg,0,ref.alignment);
  3672. end
  3673. else if (op=A_LDR) and
  3674. ((oppostfix in [PF_SH,PF_SB]) or
  3675. (abs(ref.offset)>124)) then
  3676. begin
  3677. tmpreg:=getintregister(list,OS_ADDR);
  3678. a_loadaddr_ref_reg(list,ref,tmpreg);
  3679. reference_reset_base(href,tmpreg,0,ref.alignment);
  3680. end;
  3681. Result:=inherited handle_load_store(list, op, oppostfix, reg, href);
  3682. end;
  3683. procedure tthumbcgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  3684. var
  3685. tmpreg,overflowreg : tregister;
  3686. asmop : tasmop;
  3687. begin
  3688. case op of
  3689. OP_NEG:
  3690. list.concat(taicpu.op_reg_reg(A_NEG,dst,src));
  3691. OP_NOT:
  3692. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  3693. OP_DIV,OP_IDIV:
  3694. internalerror(200308284);
  3695. OP_ROL:
  3696. begin
  3697. if not(size in [OS_32,OS_S32]) then
  3698. internalerror(2008072801);
  3699. { simulate ROL by ror'ing 32-value }
  3700. tmpreg:=getintregister(list,OS_32);
  3701. a_load_const_reg(list,OS_32,32,tmpreg);
  3702. list.concat(taicpu.op_reg_reg(A_SUB,tmpreg,src));
  3703. list.concat(taicpu.op_reg_reg(A_ROR,dst,src));
  3704. end;
  3705. else
  3706. begin
  3707. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3708. list.concat(setoppostfix(
  3709. taicpu.op_reg_reg(op_reg_opcg2asmop[op],dst,src),op_reg_postfix[op]));
  3710. end;
  3711. end;
  3712. maybeadjustresult(list,op,size,dst);
  3713. end;
  3714. procedure tthumbcgarm.a_op_const_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; dst: tregister);
  3715. var
  3716. tmpreg : tregister;
  3717. so : tshifterop;
  3718. l1 : longint;
  3719. imm1, imm2: DWord;
  3720. begin
  3721. //!!! ovloc.loc:=LOC_VOID;
  3722. if {$ifopt R+}(a<>-2147483648) and{$endif} {!!!!!! not setflags and } is_thumb_imm(-a) then
  3723. case op of
  3724. OP_ADD:
  3725. begin
  3726. op:=OP_SUB;
  3727. a:=aint(dword(-a));
  3728. end;
  3729. OP_SUB:
  3730. begin
  3731. op:=OP_ADD;
  3732. a:=aint(dword(-a));
  3733. end
  3734. end;
  3735. if is_thumb_imm(a) and (op in [OP_ADD,OP_SUB]) then
  3736. begin
  3737. // if cgsetflags or setflags then
  3738. a_reg_alloc(list,NR_DEFAULTFLAGS);
  3739. list.concat(setoppostfix(
  3740. taicpu.op_reg_const(op_reg_opcg2asmop[op],dst,a),op_reg_postfix[op]));
  3741. if (cgsetflags {!!! or setflags }) and (size in [OS_8,OS_16,OS_32]) then
  3742. begin
  3743. //!!! ovloc.loc:=LOC_FLAGS;
  3744. case op of
  3745. OP_ADD:
  3746. //!!! ovloc.resflags:=F_CS;
  3747. ;
  3748. OP_SUB:
  3749. //!!! ovloc.resflags:=F_CC;
  3750. ;
  3751. end;
  3752. end;
  3753. end
  3754. else
  3755. begin
  3756. { there could be added some more sophisticated optimizations }
  3757. if (op in [OP_MUL,OP_IMUL,OP_DIV,OP_IDIV]) and (a=1) then
  3758. a_load_reg_reg(list,size,size,dst,dst)
  3759. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  3760. a_load_const_reg(list,size,0,dst)
  3761. else if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  3762. a_op_reg_reg(list,OP_NEG,size,dst,dst)
  3763. { we do this here instead in the peephole optimizer because
  3764. it saves us a register }
  3765. {$ifdef DUMMY}
  3766. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  3767. a_op_const_reg_reg(list,OP_SHL,size,l1,dst,dst)
  3768. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  3769. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  3770. begin
  3771. if l1>32 then{roozbeh does this ever happen?}
  3772. internalerror(200308296);
  3773. shifterop_reset(so);
  3774. so.shiftmode:=SM_LSL;
  3775. so.shiftimm:=l1;
  3776. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,dst,dst,so));
  3777. end
  3778. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  3779. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  3780. begin
  3781. if l1>32 then{does this ever happen?}
  3782. internalerror(201205181);
  3783. shifterop_reset(so);
  3784. so.shiftmode:=SM_LSL;
  3785. so.shiftimm:=l1;
  3786. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,dst,dst,so));
  3787. end
  3788. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,dst,dst) then
  3789. begin
  3790. { nothing to do on success }
  3791. end
  3792. {$endif DUMMY}
  3793. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  3794. Just using mov x, #0 might allow some easier optimizations down the line. }
  3795. else if (op = OP_AND) and (dword(a)=0) then
  3796. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  3797. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  3798. else if (op = OP_AND) and (not(dword(a))=0) then
  3799. // do nothing
  3800. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  3801. broader range of shifterconstants.}
  3802. {$ifdef DUMMY}
  3803. else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  3804. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,not(dword(a))))
  3805. else if (op = OP_AND) and split_into_shifter_const(not(dword(a)), imm1, imm2) then
  3806. begin
  3807. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm1));
  3808. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,dst,imm2));
  3809. end
  3810. else if (op in [OP_ADD, OP_SUB, OP_OR]) and
  3811. not(cgsetflags or setflags) and
  3812. split_into_shifter_const(a, imm1, imm2) then
  3813. begin
  3814. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm1));
  3815. list.concat(taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,dst,imm2));
  3816. end
  3817. {$endif DUMMY}
  3818. else if (op in [OP_SHL, OP_SHR, OP_SAR]) then
  3819. begin
  3820. list.concat(taicpu.op_reg_reg_const(op_reg_opcg2asmop[op],dst,dst,a));
  3821. end
  3822. else
  3823. begin
  3824. tmpreg:=getintregister(list,size);
  3825. a_load_const_reg(list,size,a,tmpreg);
  3826. a_op_reg_reg(list,op,size,tmpreg,dst);
  3827. end;
  3828. end;
  3829. maybeadjustresult(list,op,size,dst);
  3830. end;
  3831. procedure tthumbcgarm.a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister);
  3832. begin
  3833. if (op=OP_ADD) and (src=NR_R13) and (dst<>NR_R13) and ((a mod 4)=0) and (a>0) and (a<=1020) then
  3834. list.concat(taicpu.op_reg_reg_const(A_ADD,dst,src,a))
  3835. else
  3836. inherited a_op_const_reg_reg(list,op,size,a,src,dst);
  3837. end;
  3838. procedure tthumbcgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  3839. var
  3840. l1,l2 : tasmlabel;
  3841. ai : taicpu;
  3842. begin
  3843. current_asmdata.getjumplabel(l1);
  3844. current_asmdata.getjumplabel(l2);
  3845. ai:=setcondition(taicpu.op_sym(A_B,l1),flags_to_cond(f));
  3846. ai.is_jmp:=true;
  3847. list.concat(ai);
  3848. list.concat(taicpu.op_reg_const(A_MOV,reg,0));
  3849. list.concat(taicpu.op_sym(A_B,l2));
  3850. cg.a_label(list,l1);
  3851. list.concat(taicpu.op_reg_const(A_MOV,reg,1));
  3852. a_reg_dealloc(list,NR_DEFAULTFLAGS);
  3853. cg.a_label(list,l2);
  3854. end;
  3855. procedure tthumb2cgarm.init_register_allocators;
  3856. begin
  3857. inherited init_register_allocators;
  3858. { currently, we save R14 always, so we can use it }
  3859. if (target_info.system<>system_arm_darwin) then
  3860. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3861. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3862. RS_R9,RS_R10,RS_R12,RS_R14],first_int_imreg,[])
  3863. else
  3864. { r9 is not available on Darwin according to the llvm code generator }
  3865. rg[R_INTREGISTER]:=trgintcputhumb2.create(R_INTREGISTER,R_SUBWHOLE,
  3866. [RS_R0,RS_R1,RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,
  3867. RS_R10,RS_R12,RS_R14],first_int_imreg,[]);
  3868. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  3869. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7],first_fpu_imreg,[]);
  3870. if current_settings.fputype=fpu_vfpv3 then
  3871. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3872. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3873. RS_D16,RS_D17,RS_D18,RS_D19,RS_D20,RS_D21,RS_D22,RS_D23,RS_D24,RS_D25,RS_D26,RS_D27,RS_D28,RS_D29,RS_D30,RS_D31,
  3874. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3875. ],first_mm_imreg,[])
  3876. else if current_settings.fputype in [fpu_fpv4_s16,fpu_vfpv3_d16] then
  3877. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBFD,
  3878. [RS_D0,RS_D1,RS_D2,RS_D3,RS_D4,RS_D5,RS_D6,RS_D7,
  3879. RS_D8,RS_D9,RS_D10,RS_D11,RS_D12,RS_D13,RS_D14,RS_D15
  3880. ],first_mm_imreg,[])
  3881. else
  3882. rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBNONE,
  3883. [RS_S0,RS_S1,RS_R2,RS_R3,RS_R4,RS_S31],first_mm_imreg,[]);
  3884. end;
  3885. procedure tthumb2cgarm.done_register_allocators;
  3886. begin
  3887. rg[R_INTREGISTER].free;
  3888. rg[R_FPUREGISTER].free;
  3889. rg[R_MMREGISTER].free;
  3890. inherited done_register_allocators;
  3891. end;
  3892. procedure tthumb2cgarm.a_call_reg(list : TAsmList;reg: tregister);
  3893. begin
  3894. list.concat(taicpu.op_reg(A_BLX, reg));
  3895. {
  3896. the compiler does not properly set this flag anymore in pass 1, and
  3897. for now we only need it after pass 2 (I hope) (JM)
  3898. if not(pi_do_call in current_procinfo.flags) then
  3899. internalerror(2003060703);
  3900. }
  3901. include(current_procinfo.flags,pi_do_call);
  3902. end;
  3903. procedure tthumb2cgarm.a_load_const_reg(list : TAsmList; size: tcgsize; a : tcgint;reg : tregister);
  3904. var
  3905. imm_shift : byte;
  3906. l : tasmlabel;
  3907. hr : treference;
  3908. begin
  3909. if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then
  3910. internalerror(2002090902);
  3911. if is_thumb32_imm(a) then
  3912. list.concat(taicpu.op_reg_const(A_MOV,reg,a))
  3913. else if is_thumb32_imm(not(a)) then
  3914. list.concat(taicpu.op_reg_const(A_MVN,reg,not(a)))
  3915. else if (a and $FFFF)=a then
  3916. list.concat(taicpu.op_reg_const(A_MOVW,reg,a))
  3917. else
  3918. begin
  3919. reference_reset(hr,4);
  3920. current_asmdata.getjumplabel(l);
  3921. cg.a_label(current_procinfo.aktlocaldata,l);
  3922. hr.symboldata:=current_procinfo.aktlocaldata.last;
  3923. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));
  3924. hr.symbol:=l;
  3925. hr.base:=NR_PC;
  3926. list.concat(taicpu.op_reg_ref(A_LDR,reg,hr));
  3927. end;
  3928. end;
  3929. procedure tthumb2cgarm.a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);
  3930. var
  3931. oppostfix:toppostfix;
  3932. usedtmpref: treference;
  3933. tmpreg,tmpreg2 : tregister;
  3934. so : tshifterop;
  3935. dir : integer;
  3936. begin
  3937. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  3938. FromSize := ToSize;
  3939. case FromSize of
  3940. { signed integer registers }
  3941. OS_8:
  3942. oppostfix:=PF_B;
  3943. OS_S8:
  3944. oppostfix:=PF_SB;
  3945. OS_16:
  3946. oppostfix:=PF_H;
  3947. OS_S16:
  3948. oppostfix:=PF_SH;
  3949. OS_32,
  3950. OS_S32:
  3951. oppostfix:=PF_None;
  3952. else
  3953. InternalError(200308299);
  3954. end;
  3955. if (ref.alignment in [1,2]) and (ref.alignment<tcgsize2size[fromsize]) then
  3956. begin
  3957. if target_info.endian=endian_big then
  3958. dir:=-1
  3959. else
  3960. dir:=1;
  3961. case FromSize of
  3962. OS_16,OS_S16:
  3963. begin
  3964. { only complicated references need an extra loadaddr }
  3965. if assigned(ref.symbol) or
  3966. (ref.index<>NR_NO) or
  3967. (ref.offset<-255) or
  3968. (ref.offset>4094) or
  3969. { sometimes the compiler reused registers }
  3970. (reg=ref.index) or
  3971. (reg=ref.base) then
  3972. begin
  3973. tmpreg2:=getintregister(list,OS_INT);
  3974. a_loadaddr_ref_reg(list,ref,tmpreg2);
  3975. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  3976. end
  3977. else
  3978. usedtmpref:=ref;
  3979. if target_info.endian=endian_big then
  3980. inc(usedtmpref.offset,1);
  3981. shifterop_reset(so);so.shiftmode:=SM_LSL;so.shiftimm:=8;
  3982. tmpreg:=getintregister(list,OS_INT);
  3983. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  3984. inc(usedtmpref.offset,dir);
  3985. if FromSize=OS_16 then
  3986. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg)
  3987. else
  3988. a_internal_load_ref_reg(list,OS_S8,OS_S8,usedtmpref,tmpreg);
  3989. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  3990. end;
  3991. OS_32,OS_S32:
  3992. begin
  3993. tmpreg:=getintregister(list,OS_INT);
  3994. { only complicated references need an extra loadaddr }
  3995. if assigned(ref.symbol) or
  3996. (ref.index<>NR_NO) or
  3997. (ref.offset<-255) or
  3998. (ref.offset>4092) or
  3999. { sometimes the compiler reused registers }
  4000. (reg=ref.index) or
  4001. (reg=ref.base) then
  4002. begin
  4003. tmpreg2:=getintregister(list,OS_INT);
  4004. a_loadaddr_ref_reg(list,ref,tmpreg2);
  4005. reference_reset_base(usedtmpref,tmpreg2,0,ref.alignment);
  4006. end
  4007. else
  4008. usedtmpref:=ref;
  4009. shifterop_reset(so);so.shiftmode:=SM_LSL;
  4010. if ref.alignment=2 then
  4011. begin
  4012. if target_info.endian=endian_big then
  4013. inc(usedtmpref.offset,2);
  4014. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,reg);
  4015. inc(usedtmpref.offset,dir*2);
  4016. a_internal_load_ref_reg(list,OS_16,OS_16,usedtmpref,tmpreg);
  4017. so.shiftimm:=16;
  4018. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4019. end
  4020. else
  4021. begin
  4022. if target_info.endian=endian_big then
  4023. inc(usedtmpref.offset,3);
  4024. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,reg);
  4025. inc(usedtmpref.offset,dir);
  4026. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4027. so.shiftimm:=8;
  4028. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4029. inc(usedtmpref.offset,dir);
  4030. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4031. so.shiftimm:=16;
  4032. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4033. inc(usedtmpref.offset,dir);
  4034. a_internal_load_ref_reg(list,OS_8,OS_8,usedtmpref,tmpreg);
  4035. so.shiftimm:=24;
  4036. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ORR,reg,reg,tmpreg,so));
  4037. end;
  4038. end
  4039. else
  4040. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4041. end;
  4042. end
  4043. else
  4044. handle_load_store(list,A_LDR,oppostfix,reg,ref);
  4045. if (fromsize=OS_S8) and (tosize = OS_16) then
  4046. a_load_reg_reg(list,OS_16,OS_32,reg,reg);
  4047. end;
  4048. procedure tthumb2cgarm.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);
  4049. begin
  4050. if op = OP_NOT then
  4051. begin
  4052. list.concat(taicpu.op_reg_reg(A_MVN,dst,src));
  4053. case size of
  4054. OS_8: list.concat(taicpu.op_reg_reg(A_UXTB,dst,dst));
  4055. OS_S8: list.concat(taicpu.op_reg_reg(A_SXTB,dst,dst));
  4056. OS_16: list.concat(taicpu.op_reg_reg(A_UXTH,dst,dst));
  4057. OS_S16: list.concat(taicpu.op_reg_reg(A_SXTH,dst,dst));
  4058. end;
  4059. end
  4060. else
  4061. inherited a_op_reg_reg(list, op, size, src, dst);
  4062. end;
  4063. procedure tthumb2cgarm.a_op_const_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4064. var
  4065. shift, width : byte;
  4066. tmpreg : tregister;
  4067. so : tshifterop;
  4068. l1 : longint;
  4069. begin
  4070. ovloc.loc:=LOC_VOID;
  4071. if {$ifopt R+}(a<>-2147483648) and{$endif} is_shifter_const(-a,shift) then
  4072. case op of
  4073. OP_ADD:
  4074. begin
  4075. op:=OP_SUB;
  4076. a:=aint(dword(-a));
  4077. end;
  4078. OP_SUB:
  4079. begin
  4080. op:=OP_ADD;
  4081. a:=aint(dword(-a));
  4082. end
  4083. end;
  4084. if is_shifter_const(a,shift) and not(op in [OP_IMUL,OP_MUL]) then
  4085. case op of
  4086. OP_NEG,OP_NOT,
  4087. OP_DIV,OP_IDIV:
  4088. internalerror(200308285);
  4089. OP_SHL:
  4090. begin
  4091. if a>32 then
  4092. internalerror(2014020703);
  4093. if a<>0 then
  4094. begin
  4095. shifterop_reset(so);
  4096. so.shiftmode:=SM_LSL;
  4097. so.shiftimm:=a;
  4098. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4099. end
  4100. else
  4101. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4102. end;
  4103. OP_ROL:
  4104. begin
  4105. if a>32 then
  4106. internalerror(2014020704);
  4107. if a<>0 then
  4108. begin
  4109. shifterop_reset(so);
  4110. so.shiftmode:=SM_ROR;
  4111. so.shiftimm:=32-a;
  4112. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4113. end
  4114. else
  4115. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4116. end;
  4117. OP_ROR:
  4118. begin
  4119. if a>32 then
  4120. internalerror(2014020705);
  4121. if a<>0 then
  4122. begin
  4123. shifterop_reset(so);
  4124. so.shiftmode:=SM_ROR;
  4125. so.shiftimm:=a;
  4126. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4127. end
  4128. else
  4129. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4130. end;
  4131. OP_SHR:
  4132. begin
  4133. if a>32 then
  4134. internalerror(200308292);
  4135. shifterop_reset(so);
  4136. if a<>0 then
  4137. begin
  4138. so.shiftmode:=SM_LSR;
  4139. so.shiftimm:=a;
  4140. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4141. end
  4142. else
  4143. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4144. end;
  4145. OP_SAR:
  4146. begin
  4147. if a>32 then
  4148. internalerror(200308295);
  4149. if a<>0 then
  4150. begin
  4151. shifterop_reset(so);
  4152. so.shiftmode:=SM_ASR;
  4153. so.shiftimm:=a;
  4154. list.concat(taicpu.op_reg_reg_shifterop(A_MOV,dst,src,so));
  4155. end
  4156. else
  4157. list.concat(taicpu.op_reg_reg(A_MOV,dst,src));
  4158. end;
  4159. else
  4160. if (op in [OP_SUB, OP_ADD]) and
  4161. ((a < 0) or
  4162. (a > 4095)) then
  4163. begin
  4164. tmpreg:=getintregister(list,size);
  4165. a_load_const_reg(list, size, a, tmpreg);
  4166. if cgsetflags or setflags then
  4167. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4168. list.concat(setoppostfix(
  4169. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src,tmpreg),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4170. end
  4171. else
  4172. begin
  4173. if cgsetflags or setflags then
  4174. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4175. list.concat(setoppostfix(
  4176. taicpu.op_reg_reg_const(op_reg_reg_opcg2asmop[op],dst,src,a),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4177. end;
  4178. if (cgsetflags or setflags) and (size in [OS_8,OS_16,OS_32]) then
  4179. begin
  4180. ovloc.loc:=LOC_FLAGS;
  4181. case op of
  4182. OP_ADD:
  4183. ovloc.resflags:=F_CS;
  4184. OP_SUB:
  4185. ovloc.resflags:=F_CC;
  4186. end;
  4187. end;
  4188. end
  4189. else
  4190. begin
  4191. { there could be added some more sophisticated optimizations }
  4192. if (op in [OP_MUL,OP_IMUL]) and (a=1) then
  4193. a_load_reg_reg(list,size,size,src,dst)
  4194. else if (op in [OP_MUL,OP_IMUL]) and (a=0) then
  4195. a_load_const_reg(list,size,0,dst)
  4196. else if (op in [OP_IMUL]) and (a=-1) then
  4197. a_op_reg_reg(list,OP_NEG,size,src,dst)
  4198. { we do this here instead in the peephole optimizer because
  4199. it saves us a register }
  4200. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) and not(cgsetflags or setflags) then
  4201. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  4202. { for example : b=a*5 -> b=a*4+a with add instruction and shl }
  4203. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a-1,l1) and not(cgsetflags or setflags) then
  4204. begin
  4205. if l1>32 then{roozbeh does this ever happen?}
  4206. internalerror(200308296);
  4207. shifterop_reset(so);
  4208. so.shiftmode:=SM_LSL;
  4209. so.shiftimm:=l1;
  4210. list.concat(taicpu.op_reg_reg_reg_shifterop(A_ADD,dst,src,src,so));
  4211. end
  4212. { for example : b=a*7 -> b=a*8-a with rsb instruction and shl }
  4213. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a+1,l1) and not(cgsetflags or setflags) then
  4214. begin
  4215. if l1>32 then{does this ever happen?}
  4216. internalerror(201205181);
  4217. shifterop_reset(so);
  4218. so.shiftmode:=SM_LSL;
  4219. so.shiftimm:=l1;
  4220. list.concat(taicpu.op_reg_reg_reg_shifterop(A_RSB,dst,src,src,so));
  4221. end
  4222. else if (op in [OP_MUL,OP_IMUL]) and not(cgsetflags or setflags) and try_optimized_mul32_const_reg_reg(list,a,src,dst) then
  4223. begin
  4224. { nothing to do on success }
  4225. end
  4226. { x := y and 0; just clears a register, this sometimes gets generated on 64bit ops.
  4227. Just using mov x, #0 might allow some easier optimizations down the line. }
  4228. else if (op = OP_AND) and (dword(a)=0) then
  4229. list.concat(taicpu.op_reg_const(A_MOV,dst,0))
  4230. { x := y AND $FFFFFFFF just copies the register, so use mov for better optimizations }
  4231. else if (op = OP_AND) and (not(dword(a))=0) then
  4232. list.concat(taicpu.op_reg_reg(A_MOV,dst,src))
  4233. { BIC clears the specified bits, while AND keeps them, using BIC allows to use a
  4234. broader range of shifterconstants.}
  4235. {else if (op = OP_AND) and is_shifter_const(not(dword(a)),shift) then
  4236. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))}
  4237. else if (op = OP_AND) and is_thumb32_imm(a) then
  4238. list.concat(taicpu.op_reg_reg_const(A_AND,dst,src,dword(a)))
  4239. else if (op = OP_AND) and (a = $FFFF) then
  4240. list.concat(taicpu.op_reg_reg(A_UXTH,dst,src))
  4241. else if (op = OP_AND) and is_thumb32_imm(not(dword(a))) then
  4242. list.concat(taicpu.op_reg_reg_const(A_BIC,dst,src,not(dword(a))))
  4243. else if (op = OP_AND) and is_continuous_mask(not(a), shift, width) then
  4244. begin
  4245. a_load_reg_reg(list,size,size,src,dst);
  4246. list.concat(taicpu.op_reg_const_const(A_BFC,dst,shift,width))
  4247. end
  4248. else
  4249. begin
  4250. tmpreg:=getintregister(list,size);
  4251. a_load_const_reg(list,size,a,tmpreg);
  4252. a_op_reg_reg_reg_checkoverflow(list,op,size,tmpreg,src,dst,setflags,ovloc);
  4253. end;
  4254. end;
  4255. maybeadjustresult(list,op,size,dst);
  4256. end;
  4257. const
  4258. op_reg_reg_opcg2asmopThumb2: array[TOpCG] of tasmop =
  4259. (A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NONE,A_MVN,A_ORR,
  4260. A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR);
  4261. procedure tthumb2cgarm.a_op_reg_reg_reg_checkoverflow(list: TAsmList; op: TOpCg; size: tcgsize; src1, src2, dst: tregister;setflags : boolean;var ovloc : tlocation);
  4262. var
  4263. so : tshifterop;
  4264. tmpreg,overflowreg : tregister;
  4265. asmop : tasmop;
  4266. begin
  4267. ovloc.loc:=LOC_VOID;
  4268. case op of
  4269. OP_NEG,OP_NOT:
  4270. internalerror(200308286);
  4271. OP_ROL:
  4272. begin
  4273. if not(size in [OS_32,OS_S32]) then
  4274. internalerror(2008072801);
  4275. { simulate ROL by ror'ing 32-value }
  4276. tmpreg:=getintregister(list,OS_32);
  4277. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,32));
  4278. list.concat(taicpu.op_reg_reg_reg(A_SUB,src1,tmpreg,src1));
  4279. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4280. end;
  4281. OP_ROR:
  4282. begin
  4283. if not(size in [OS_32,OS_S32]) then
  4284. internalerror(2008072802);
  4285. list.concat(taicpu.op_reg_reg_reg(A_ROR, dst, src2, src1));
  4286. end;
  4287. OP_IMUL,
  4288. OP_MUL:
  4289. begin
  4290. if cgsetflags or setflags then
  4291. begin
  4292. overflowreg:=getintregister(list,size);
  4293. if op=OP_IMUL then
  4294. asmop:=A_SMULL
  4295. else
  4296. asmop:=A_UMULL;
  4297. { the arm doesn't allow that rd and rm are the same }
  4298. if dst=src2 then
  4299. begin
  4300. if dst<>src1 then
  4301. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src1,src2))
  4302. else
  4303. begin
  4304. tmpreg:=getintregister(list,size);
  4305. a_load_reg_reg(list,size,size,src2,dst);
  4306. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,tmpreg,src1));
  4307. end;
  4308. end
  4309. else
  4310. list.concat(taicpu.op_reg_reg_reg_reg(asmop,dst,overflowreg,src2,src1));
  4311. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4312. if op=OP_IMUL then
  4313. begin
  4314. shifterop_reset(so);
  4315. so.shiftmode:=SM_ASR;
  4316. so.shiftimm:=31;
  4317. list.concat(taicpu.op_reg_reg_shifterop(A_CMP,overflowreg,dst,so));
  4318. end
  4319. else
  4320. list.concat(taicpu.op_reg_const(A_CMP,overflowreg,0));
  4321. ovloc.loc:=LOC_FLAGS;
  4322. ovloc.resflags:=F_NE;
  4323. end
  4324. else
  4325. begin
  4326. { the arm doesn't allow that rd and rm are the same }
  4327. if dst=src2 then
  4328. begin
  4329. if dst<>src1 then
  4330. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src1,src2))
  4331. else
  4332. begin
  4333. tmpreg:=getintregister(list,size);
  4334. a_load_reg_reg(list,size,size,src2,dst);
  4335. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,tmpreg,src1));
  4336. end;
  4337. end
  4338. else
  4339. list.concat(taicpu.op_reg_reg_reg(A_MUL,dst,src2,src1));
  4340. end;
  4341. end;
  4342. else
  4343. begin
  4344. if cgsetflags or setflags then
  4345. a_reg_alloc(list,NR_DEFAULTFLAGS);
  4346. {$ifdef dummy}
  4347. { R13 is not allowed for certain instruction operands }
  4348. if op_reg_reg_opcg2asmopThumb2[op] in [A_ADD,A_SUB,A_AND,A_BIC,A_EOR] then
  4349. begin
  4350. if getsupreg(dst)=RS_R13 then
  4351. begin
  4352. tmpreg:=getintregister(list,OS_INT);
  4353. a_load_reg_reg(list,OS_INT,OS_INT,dst,tmpreg);
  4354. dst:=tmpreg;
  4355. end;
  4356. if getsupreg(src1)=RS_R13 then
  4357. begin
  4358. tmpreg:=getintregister(list,OS_INT);
  4359. a_load_reg_reg(list,OS_INT,OS_INT,src1,tmpreg);
  4360. src1:=tmpreg;
  4361. end;
  4362. end;
  4363. {$endif}
  4364. list.concat(setoppostfix(
  4365. taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmopThumb2[op],dst,src2,src1),toppostfix(ord(cgsetflags or setflags)*ord(PF_S))));
  4366. end;
  4367. end;
  4368. maybeadjustresult(list,op,size,dst);
  4369. end;
  4370. procedure tthumb2cgarm.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
  4371. var item: taicpu;
  4372. begin
  4373. list.concat(taicpu.op_cond(A_ITE, flags_to_cond(f)));
  4374. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,1),flags_to_cond(f)));
  4375. list.concat(setcondition(taicpu.op_reg_const(A_MOV,reg,0),inverse_cond(flags_to_cond(f))));
  4376. end;
  4377. procedure tthumb2cgarm.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
  4378. var
  4379. ref : treference;
  4380. shift : byte;
  4381. firstfloatreg,lastfloatreg,
  4382. r : byte;
  4383. regs : tcpuregisterset;
  4384. stackmisalignment: pint;
  4385. begin
  4386. LocalSize:=align(LocalSize,4);
  4387. { call instruction does not put anything on the stack }
  4388. stackmisalignment:=0;
  4389. if not(nostackframe) then
  4390. begin
  4391. firstfloatreg:=RS_NO;
  4392. lastfloatreg:=RS_NO;
  4393. { save floating point registers? }
  4394. for r:=RS_F0 to RS_F7 do
  4395. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4396. begin
  4397. if firstfloatreg=RS_NO then
  4398. firstfloatreg:=r;
  4399. lastfloatreg:=r;
  4400. inc(stackmisalignment,12);
  4401. end;
  4402. a_reg_alloc(list,NR_STACK_POINTER_REG);
  4403. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4404. begin
  4405. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  4406. a_reg_alloc(list,NR_R12);
  4407. list.concat(taicpu.op_reg_reg(A_MOV,NR_R12,NR_STACK_POINTER_REG));
  4408. end;
  4409. { save int registers }
  4410. reference_reset(ref,4);
  4411. ref.index:=NR_STACK_POINTER_REG;
  4412. ref.addressmode:=AM_PREINDEXED;
  4413. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4414. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4415. regs:=regs+[RS_FRAME_POINTER_REG,RS_R14]
  4416. else if (regs<>[]) or (pi_do_call in current_procinfo.flags) then
  4417. include(regs,RS_R14);
  4418. if regs<>[] then
  4419. begin
  4420. for r:=RS_R0 to RS_R15 do
  4421. if (r in regs) then
  4422. inc(stackmisalignment,4);
  4423. list.concat(setoppostfix(taicpu.op_ref_regset(A_STM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4424. end;
  4425. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  4426. begin
  4427. { the framepointer now points to the saved R15, so the saved
  4428. framepointer is at R11-12 (for get_caller_frame) }
  4429. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_FRAME_POINTER_REG,NR_R12,4));
  4430. a_reg_dealloc(list,NR_R12);
  4431. end;
  4432. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4433. if (LocalSize<>0) or
  4434. ((stackmisalignment<>0) and
  4435. ((pi_do_call in current_procinfo.flags) or
  4436. (po_assembler in current_procinfo.procdef.procoptions))) then
  4437. begin
  4438. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4439. if not(is_shifter_const(localsize,shift)) then
  4440. begin
  4441. if current_procinfo.framepointer=NR_STACK_POINTER_REG then
  4442. a_reg_alloc(list,NR_R12);
  4443. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4444. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_R12));
  4445. a_reg_dealloc(list,NR_R12);
  4446. end
  4447. else
  4448. begin
  4449. a_reg_dealloc(list,NR_R12);
  4450. list.concat(taicpu.op_reg_reg_const(A_SUB,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,LocalSize));
  4451. end;
  4452. end;
  4453. if firstfloatreg<>RS_NO then
  4454. begin
  4455. reference_reset(ref,4);
  4456. if tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023 then
  4457. begin
  4458. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  4459. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4460. ref.base:=NR_R12;
  4461. end
  4462. else
  4463. begin
  4464. ref.base:=current_procinfo.framepointer;
  4465. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  4466. end;
  4467. list.concat(taicpu.op_reg_const_ref(A_SFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4468. lastfloatreg-firstfloatreg+1,ref));
  4469. end;
  4470. end;
  4471. end;
  4472. procedure tthumb2cgarm.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
  4473. var
  4474. ref : treference;
  4475. firstfloatreg,lastfloatreg,
  4476. r : byte;
  4477. shift : byte;
  4478. regs : tcpuregisterset;
  4479. LocalSize : longint;
  4480. stackmisalignment: pint;
  4481. begin
  4482. if not(nostackframe) then
  4483. begin
  4484. stackmisalignment:=0;
  4485. { restore floating point register }
  4486. firstfloatreg:=RS_NO;
  4487. lastfloatreg:=RS_NO;
  4488. { save floating point registers? }
  4489. for r:=RS_F0 to RS_F7 do
  4490. if r in rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall) then
  4491. begin
  4492. if firstfloatreg=RS_NO then
  4493. firstfloatreg:=r;
  4494. lastfloatreg:=r;
  4495. { floating point register space is already included in
  4496. localsize below by calc_stackframe_size
  4497. inc(stackmisalignment,12);
  4498. }
  4499. end;
  4500. if firstfloatreg<>RS_NO then
  4501. begin
  4502. reference_reset(ref,4);
  4503. if tg.direction*tarmprocinfo(current_procinfo).floatregstart>=1023 then
  4504. begin
  4505. a_load_const_reg(list,OS_ADDR,-tarmprocinfo(current_procinfo).floatregstart,NR_R12);
  4506. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_R12,current_procinfo.framepointer,NR_R12));
  4507. ref.base:=NR_R12;
  4508. end
  4509. else
  4510. begin
  4511. ref.base:=current_procinfo.framepointer;
  4512. ref.offset:=tarmprocinfo(current_procinfo).floatregstart;
  4513. end;
  4514. list.concat(taicpu.op_reg_const_ref(A_LFM,newreg(R_FPUREGISTER,firstfloatreg,R_SUBWHOLE),
  4515. lastfloatreg-firstfloatreg+1,ref));
  4516. end;
  4517. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  4518. if (pi_do_call in current_procinfo.flags) or (regs<>[]) then
  4519. begin
  4520. exclude(regs,RS_R14);
  4521. include(regs,RS_R15);
  4522. end;
  4523. if (current_procinfo.framepointer<>NR_STACK_POINTER_REG) then
  4524. regs:=regs+[RS_FRAME_POINTER_REG,RS_R15];
  4525. for r:=RS_R0 to RS_R15 do
  4526. if (r in regs) then
  4527. inc(stackmisalignment,4);
  4528. stackmisalignment:=stackmisalignment mod current_settings.alignment.localalignmax;
  4529. LocalSize:=current_procinfo.calc_stackframe_size;
  4530. if (LocalSize<>0) or
  4531. ((stackmisalignment<>0) and
  4532. ((pi_do_call in current_procinfo.flags) or
  4533. (po_assembler in current_procinfo.procdef.procoptions))) then
  4534. begin
  4535. localsize:=align(localsize+stackmisalignment,current_settings.alignment.localalignmax)-stackmisalignment;
  4536. if not(is_shifter_const(LocalSize,shift)) then
  4537. begin
  4538. a_reg_alloc(list,NR_R12);
  4539. a_load_const_reg(list,OS_ADDR,LocalSize,NR_R12);
  4540. list.concat(taicpu.op_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_R12));
  4541. a_reg_dealloc(list,NR_R12);
  4542. end
  4543. else
  4544. begin
  4545. a_reg_dealloc(list,NR_R12);
  4546. list.concat(taicpu.op_reg_const(A_ADD,NR_STACK_POINTER_REG,LocalSize));
  4547. end;
  4548. end;
  4549. if regs=[] then
  4550. list.concat(taicpu.op_reg_reg(A_MOV,NR_R15,NR_R14))
  4551. else
  4552. begin
  4553. reference_reset(ref,4);
  4554. ref.index:=NR_STACK_POINTER_REG;
  4555. ref.addressmode:=AM_PREINDEXED;
  4556. list.concat(setoppostfix(taicpu.op_ref_regset(A_LDM,ref,R_INTREGISTER,R_SUBWHOLE,regs),PF_FD));
  4557. end;
  4558. end
  4559. else
  4560. list.concat(taicpu.op_reg_reg(A_MOV,NR_PC,NR_R14));
  4561. end;
  4562. function tthumb2cgarm.handle_load_store(list:TAsmList;op: tasmop;oppostfix : toppostfix;reg:tregister;ref: treference):treference;
  4563. var
  4564. tmpreg : tregister;
  4565. tmpref : treference;
  4566. l : tasmlabel;
  4567. so: tshifterop;
  4568. begin
  4569. tmpreg:=NR_NO;
  4570. { Be sure to have a base register }
  4571. if (ref.base=NR_NO) then
  4572. begin
  4573. if ref.shiftmode<>SM_None then
  4574. internalerror(2014020706);
  4575. ref.base:=ref.index;
  4576. ref.index:=NR_NO;
  4577. end;
  4578. { absolute symbols can't be handled directly, we've to store the symbol reference
  4579. in the text segment and access it pc relative
  4580. For now, we assume that references where base or index equals to PC are already
  4581. relative, all other references are assumed to be absolute and thus they need
  4582. to be handled extra.
  4583. A proper solution would be to change refoptions to a set and store the information
  4584. if the symbol is absolute or relative there.
  4585. }
  4586. if (assigned(ref.symbol) and
  4587. not(is_pc(ref.base)) and
  4588. not(is_pc(ref.index))
  4589. ) or
  4590. { [#xxx] isn't a valid address operand }
  4591. ((ref.base=NR_NO) and (ref.index=NR_NO)) or
  4592. //(ref.offset<-4095) or
  4593. (ref.offset<-255) or
  4594. (ref.offset>4095) or
  4595. ((oppostfix in [PF_SB,PF_H,PF_SH]) and
  4596. ((ref.offset<-255) or
  4597. (ref.offset>255)
  4598. )
  4599. ) or
  4600. (((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and
  4601. ((ref.offset<-1020) or
  4602. (ref.offset>1020) or
  4603. ((abs(ref.offset) mod 4)<>0) or
  4604. { the usual pc relative symbol handling assumes possible offsets of +/- 4095 }
  4605. assigned(ref.symbol)
  4606. )
  4607. ) then
  4608. begin
  4609. reference_reset(tmpref,4);
  4610. { load symbol }
  4611. tmpreg:=getintregister(list,OS_INT);
  4612. if assigned(ref.symbol) then
  4613. begin
  4614. current_asmdata.getjumplabel(l);
  4615. cg.a_label(current_procinfo.aktlocaldata,l);
  4616. tmpref.symboldata:=current_procinfo.aktlocaldata.last;
  4617. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset));
  4618. { load consts entry }
  4619. tmpref.symbol:=l;
  4620. tmpref.base:=NR_R15;
  4621. list.concat(taicpu.op_reg_ref(A_LDR,tmpreg,tmpref));
  4622. { in case of LDF/STF, we got rid of the NR_R15 }
  4623. if is_pc(ref.base) then
  4624. ref.base:=NR_NO;
  4625. if is_pc(ref.index) then
  4626. ref.index:=NR_NO;
  4627. end
  4628. else
  4629. a_load_const_reg(list,OS_ADDR,ref.offset,tmpreg);
  4630. if (ref.base<>NR_NO) then
  4631. begin
  4632. if ref.index<>NR_NO then
  4633. begin
  4634. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4635. ref.base:=tmpreg;
  4636. end
  4637. else
  4638. begin
  4639. ref.index:=tmpreg;
  4640. ref.shiftimm:=0;
  4641. ref.signindex:=1;
  4642. ref.shiftmode:=SM_None;
  4643. end;
  4644. end
  4645. else
  4646. ref.base:=tmpreg;
  4647. ref.offset:=0;
  4648. ref.symbol:=nil;
  4649. end;
  4650. if (ref.base<>NR_NO) and (ref.index<>NR_NO) and (ref.offset<>0) then
  4651. begin
  4652. if tmpreg<>NR_NO then
  4653. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,tmpreg,tmpreg)
  4654. else
  4655. begin
  4656. tmpreg:=getintregister(list,OS_ADDR);
  4657. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,ref.offset,ref.base,tmpreg);
  4658. ref.base:=tmpreg;
  4659. end;
  4660. ref.offset:=0;
  4661. end;
  4662. { Hack? Thumb2 doesn't allow PC indexed addressing modes(although it does in the specification) }
  4663. if (ref.base=NR_R15) and (ref.index<>NR_NO) and (ref.shiftmode <> sm_none) then
  4664. begin
  4665. tmpreg:=getintregister(list,OS_ADDR);
  4666. list.concat(taicpu.op_reg_reg(A_MOV, tmpreg, NR_R15));
  4667. ref.base := tmpreg;
  4668. end;
  4669. { floating point operations have only limited references
  4670. we expect here, that a base is already set }
  4671. if ((op in [A_LDF,A_STF,A_FLDS,A_FLDD,A_FSTS,A_FSTD]) or (op=A_VSTR) or (op=A_VLDR)) and (ref.index<>NR_NO) then
  4672. begin
  4673. if ref.shiftmode<>SM_none then
  4674. internalerror(200309121);
  4675. if tmpreg<>NR_NO then
  4676. begin
  4677. if ref.base=tmpreg then
  4678. begin
  4679. if ref.signindex<0 then
  4680. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,tmpreg,ref.index))
  4681. else
  4682. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,tmpreg,ref.index));
  4683. ref.index:=NR_NO;
  4684. end
  4685. else
  4686. begin
  4687. if ref.index<>tmpreg then
  4688. internalerror(200403161);
  4689. if ref.signindex<0 then
  4690. list.concat(taicpu.op_reg_reg_reg(A_SUB,tmpreg,ref.base,tmpreg))
  4691. else
  4692. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  4693. ref.base:=tmpreg;
  4694. ref.index:=NR_NO;
  4695. end;
  4696. end
  4697. else
  4698. begin
  4699. tmpreg:=getintregister(list,OS_ADDR);
  4700. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,ref.index));
  4701. ref.base:=tmpreg;
  4702. ref.index:=NR_NO;
  4703. end;
  4704. end;
  4705. list.concat(setoppostfix(taicpu.op_reg_ref(op,reg,ref),oppostfix));
  4706. Result := ref;
  4707. end;
  4708. procedure tthumb2cgarm.a_loadmm_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister; shuffle: pmmshuffle);
  4709. var
  4710. instr: taicpu;
  4711. begin
  4712. if (fromsize=OS_F32) and
  4713. (tosize=OS_F32) then
  4714. begin
  4715. instr:=setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32);
  4716. list.Concat(instr);
  4717. add_move_instruction(instr);
  4718. end
  4719. else if (fromsize=OS_F64) and
  4720. (tosize=OS_F64) then
  4721. begin
  4722. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,tregister(longint(reg2)+1),tregister(longint(reg1)+1)), PF_F32));
  4723. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VMOV,reg2,reg1), PF_F32));
  4724. end
  4725. else if (fromsize=OS_F32) and
  4726. (tosize=OS_F64) then
  4727. //list.Concat(setoppostfix(taicpu.op_reg_reg(A_VCVT,reg2,reg1), PF_F32))
  4728. begin
  4729. //list.concat(nil);
  4730. end;
  4731. end;
  4732. procedure tthumb2cgarm.a_loadmm_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister; shuffle: pmmshuffle);
  4733. begin
  4734. handle_load_store(list,A_VLDR,PF_None,reg,ref);
  4735. end;
  4736. procedure tthumb2cgarm.a_loadmm_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference; shuffle: pmmshuffle);
  4737. begin
  4738. handle_load_store(list,A_VSTR,PF_None,reg,ref);
  4739. end;
  4740. procedure tthumb2cgarm.a_loadmm_intreg_reg(list: TAsmList; fromsize, tosize: tcgsize; intreg, mmreg: tregister; shuffle: pmmshuffle);
  4741. begin
  4742. if //(shuffle=nil) and
  4743. (tosize=OS_F32) then
  4744. list.Concat(taicpu.op_reg_reg(A_VMOV,mmreg,intreg))
  4745. else
  4746. internalerror(2012100813);
  4747. end;
  4748. procedure tthumb2cgarm.a_loadmm_reg_intreg(list: TAsmList; fromsize, tosize: tcgsize; mmreg, intreg: tregister; shuffle: pmmshuffle);
  4749. begin
  4750. if //(shuffle=nil) and
  4751. (fromsize=OS_F32) then
  4752. list.Concat(taicpu.op_reg_reg(A_VMOV,intreg,mmreg))
  4753. else
  4754. internalerror(2012100814);
  4755. end;
  4756. procedure tthumb2cg64farm.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);
  4757. var tmpreg: tregister;
  4758. begin
  4759. case op of
  4760. OP_NEG:
  4761. begin
  4762. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4763. list.concat(setoppostfix(taicpu.op_reg_reg_const(A_RSB,regdst.reglo,regsrc.reglo,0),PF_S));
  4764. tmpreg:=cg.getintregister(list,OS_32);
  4765. list.concat(taicpu.op_reg_const(A_MOV,tmpreg,0));
  4766. list.concat(taicpu.op_reg_reg_reg(A_SBC,regdst.reghi,tmpreg,regsrc.reghi));
  4767. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4768. end;
  4769. else
  4770. inherited a_op64_reg_reg(list, op, size, regsrc, regdst);
  4771. end;
  4772. end;
  4773. procedure tthumbcg64farm.a_op64_reg_reg(list: TAsmList; op: TOpCG; size: tcgsize; regsrc, regdst: tregister64);
  4774. begin
  4775. case op of
  4776. OP_NEG:
  4777. begin
  4778. list.concat(taicpu.op_reg_const(A_MOV,regdst.reglo,0));
  4779. list.concat(taicpu.op_reg_const(A_MOV,regdst.reghi,0));
  4780. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4781. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4782. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4783. cg.a_reg_dealloc(list,NR_DEFAULTFLAGS);
  4784. end;
  4785. OP_NOT:
  4786. begin
  4787. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  4788. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  4789. end;
  4790. OP_AND,OP_OR,OP_XOR:
  4791. begin
  4792. cg.a_op_reg_reg(list,op,OS_32,regsrc.reglo,regdst.reglo);
  4793. cg.a_op_reg_reg(list,op,OS_32,regsrc.reghi,regdst.reghi);
  4794. end;
  4795. OP_ADD:
  4796. begin
  4797. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4798. list.concat(taicpu.op_reg_reg(A_ADD,regdst.reglo,regsrc.reglo));
  4799. list.concat(taicpu.op_reg_reg(A_ADC,regdst.reghi,regsrc.reghi));
  4800. end;
  4801. OP_SUB:
  4802. begin
  4803. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4804. list.concat(taicpu.op_reg_reg(A_SUB,regdst.reglo,regsrc.reglo));
  4805. list.concat(taicpu.op_reg_reg(A_SBC,regdst.reghi,regsrc.reghi));
  4806. end;
  4807. else
  4808. internalerror(2003083101);
  4809. end;
  4810. end;
  4811. procedure tthumbcg64farm.a_op64_const_reg(list: TAsmList; op: TOpCG; size: tcgsize; value: int64; reg: tregister64);
  4812. var
  4813. tmpreg : tregister;
  4814. b : byte;
  4815. begin
  4816. case op of
  4817. OP_AND,OP_OR,OP_XOR:
  4818. begin
  4819. cg.a_op_const_reg(list,op,OS_32,aint(lo(value)),reg.reglo);
  4820. cg.a_op_const_reg(list,op,OS_32,aint(hi(value)),reg.reghi);
  4821. end;
  4822. OP_ADD:
  4823. begin
  4824. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4825. begin
  4826. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4827. list.concat(taicpu.op_reg_const(A_ADD,reg.reglo,aint(lo(value))));
  4828. end
  4829. else
  4830. begin
  4831. tmpreg:=cg.getintregister(list,OS_32);
  4832. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4833. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4834. list.concat(taicpu.op_reg_reg(A_ADD,reg.reglo,tmpreg));
  4835. end;
  4836. tmpreg:=cg.getintregister(list,OS_32);
  4837. cg.a_load_const_reg(list,OS_32,aint(hi(value)),tmpreg);
  4838. list.concat(taicpu.op_reg_reg(A_ADC,reg.reghi,tmpreg));
  4839. end;
  4840. OP_SUB:
  4841. begin
  4842. if (aint(lo(value))>=0) and (aint(lo(value))<=255) then
  4843. begin
  4844. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4845. list.concat(taicpu.op_reg_const(A_SUB,reg.reglo,aint(lo(value))))
  4846. end
  4847. else
  4848. begin
  4849. tmpreg:=cg.getintregister(list,OS_32);
  4850. cg.a_load_const_reg(list,OS_32,aint(lo(value)),tmpreg);
  4851. cg.a_reg_alloc(list,NR_DEFAULTFLAGS);
  4852. list.concat(taicpu.op_reg_reg(A_SUB,reg.reglo,tmpreg));
  4853. end;
  4854. tmpreg:=cg.getintregister(list,OS_32);
  4855. cg.a_load_const_reg(list,OS_32,hi(value),tmpreg);
  4856. list.concat(taicpu.op_reg_reg(A_SBC,reg.reghi,tmpreg));
  4857. end;
  4858. else
  4859. internalerror(2003083101);
  4860. end;
  4861. end;
  4862. procedure create_codegen;
  4863. begin
  4864. if GenerateThumb2Code then
  4865. begin
  4866. cg:=tthumb2cgarm.create;
  4867. cg64:=tthumb2cg64farm.create;
  4868. casmoptimizer:=TCpuThumb2AsmOptimizer;
  4869. end
  4870. else if GenerateThumbCode then
  4871. begin
  4872. cg:=tthumbcgarm.create;
  4873. cg64:=tthumbcg64farm.create;
  4874. // casmoptimizer:=TCpuThumbAsmOptimizer;
  4875. end
  4876. else
  4877. begin
  4878. cg:=tarmcgarm.create;
  4879. cg64:=tarmcg64farm.create;
  4880. casmoptimizer:=TCpuAsmOptimizer;
  4881. end;
  4882. end;
  4883. end.