1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152215321542155215621572158215921602161216221632164216521662167216821692170217121722173217421752176217721782179218021812182218321842185218621872188218921902191219221932194219521962197219821992200220122022203220422052206220722082209221022112212221322142215221622172218221922202221222222232224222522262227222822292230223122322233223422352236223722382239224022412242224322442245224622472248224922502251225222532254225522562257225822592260226122622263226422652266226722682269227022712272227322742275227622772278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277727782779278027812782278327842785278627872788278927902791279227932794279527962797279827992800280128022803280428052806280728082809281028112812281328142815281628172818281928202821282228232824282528262827282828292830283128322833283428352836283728382839284028412842284328442845284628472848284928502851285228532854285528562857285828592860286128622863286428652866286728682869287028712872287328742875287628772878287928802881288228832884288528862887288828892890289128922893289428952896289728982899290029012902290329042905290629072908290929102911291229132914291529162917291829192920292129222923292429252926292729282929293029312932293329342935293629372938293929402941294229432944294529462947294829492950295129522953295429552956295729582959296029612962296329642965296629672968296929702971297229732974297529762977297829792980298129822983298429852986298729882989299029912992299329942995299629972998299930003001300230033004300530063007300830093010301130123013301430153016301730183019302030213022302330243025302630273028302930303031303230333034303530363037303830393040304130423043304430453046304730483049305030513052305330543055305630573058305930603061306230633064306530663067306830693070307130723073307430753076307730783079308030813082308330843085308630873088308930903091309230933094309530963097309830993100310131023103310431053106310731083109311031113112311331143115311631173118311931203121312231233124312531263127312831293130313131323133313431353136313731383139314031413142314331443145314631473148314931503151315231533154315531563157315831593160316131623163316431653166316731683169317031713172317331743175317631773178317931803181318231833184318531863187318831893190319131923193319431953196319731983199320032013202320332043205320632073208320932103211321232133214321532163217321832193220322132223223322432253226322732283229323032313232323332343235323632373238323932403241324232433244324532463247324832493250325132523253325432553256325732583259326032613262326332643265326632673268326932703271327232733274327532763277327832793280328132823283328432853286328732883289329032913292329332943295329632973298329933003301330233033304330533063307330833093310331133123313331433153316331733183319332033213322332333243325332633273328332933303331333233333334333533363337333833393340334133423343334433453346334733483349335033513352335333543355335633573358335933603361336233633364336533663367336833693370337133723373337433753376337733783379338033813382338333843385338633873388338933903391339233933394339533963397339833993400340134023403340434053406340734083409341034113412341334143415341634173418341934203421342234233424342534263427342834293430343134323433343434353436343734383439344034413442344334443445344634473448344934503451345234533454345534563457345834593460346134623463346434653466346734683469347034713472347334743475347634773478347934803481348234833484348534863487348834893490349134923493349434953496349734983499350035013502350335043505350635073508350935103511351235133514351535163517351835193520352135223523352435253526352735283529353035313532353335343535353635373538353935403541354235433544354535463547354835493550355135523553355435553556355735583559356035613562356335643565356635673568356935703571357235733574357535763577357835793580358135823583358435853586358735883589359035913592359335943595359635973598359936003601360236033604360536063607360836093610361136123613361436153616361736183619362036213622362336243625362636273628362936303631363236333634363536363637363836393640364136423643364436453646364736483649365036513652365336543655365636573658365936603661366236633664366536663667366836693670367136723673367436753676367736783679368036813682368336843685368636873688368936903691369236933694369536963697369836993700370137023703370437053706370737083709 |
- {
- Copyright (c) 1998-2002 by Florian Klaempfl and Peter Vreman
- Contains the abstract assembler implementation for the i386
- * Portions of this code was inspired by the NASM sources
- The Netwide Assembler is Copyright (c) 1996 Simon Tatham and
- Julian Hall. All rights reserved.
- This program is free software; you can redistribute it and/or modify
- it under the terms of the GNU General Public License as published by
- the Free Software Foundation; either version 2 of the License, or
- (at your option) any later version.
- This program is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- GNU General Public License for more details.
- You should have received a copy of the GNU General Public License
- along with this program; if not, write to the Free Software
- Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
- ****************************************************************************
- }
- unit aasmcpu;
- {$i fpcdefs.inc}
- interface
- uses
- globtype,verbose,
- cpubase,
- cgbase,cgutils,
- symtype,
- aasmbase,aasmtai,aasmdata,aasmsym,
- ogbase;
- const
- { "mov reg,reg" source operand number }
- O_MOV_SOURCE = 0;
- { "mov reg,reg" destination operand number }
- O_MOV_DEST = 1;
- { Operand types }
- OT_NONE = $00000000;
- { Bits 0..7: sizes }
- OT_BITS8 = $00000001;
- OT_BITS16 = $00000002;
- OT_BITS32 = $00000004;
- OT_BITS64 = $00000008; { x86_64 and FPU }
- OT_BITS128 = $10000000; { 16 byte SSE }
- OT_BITS256 = $20000000; { 32 byte AVX }
- OT_BITS80 = $00000010; { FPU only }
- OT_FAR = $00000020; { this means 16:16 or 16:32, like in CALL/JMP }
- OT_NEAR = $00000040;
- OT_SHORT = $00000080;
- { TODO: FAR/NEAR/SHORT are sizes too, they should be included into size mask,
- but this requires adjusting the opcode table }
- OT_SIZE_MASK = $3000001F; { all the size attributes }
- OT_NON_SIZE = longint(not OT_SIZE_MASK);
- { Bits 8..11: modifiers }
- OT_SIGNED = $00000100; { the operand need to be signed -128-127 }
- OT_TO = $00000200; { reverse effect in FADD, FSUB &c }
- OT_COLON = $00000400; { operand is followed by a colon }
- OT_MODIFIER_MASK = $00000F00;
- { Bits 12..15: type of operand }
- OT_REGISTER = $00001000;
- OT_IMMEDIATE = $00002000;
- OT_MEMORY = $0000C000; { always includes 'OT_REGMEM' bit as well }
- OT_REGMEM = $00008000; { for r/m, ie EA, operands }
- OT_TYPE_MASK = OT_REGISTER or OT_IMMEDIATE or OT_MEMORY or OT_REGMEM;
- OT_REGNORM = OT_REGISTER or OT_REGMEM; { 'normal' reg, qualifies as EA }
- { Bits 20..22, 24..26: register classes
- otf_* consts are not used alone, only to build other constants. }
- otf_reg_cdt = $00100000;
- otf_reg_gpr = $00200000;
- otf_reg_sreg = $00400000;
- otf_reg_fpu = $01000000;
- otf_reg_mmx = $02000000;
- otf_reg_xmm = $04000000;
- otf_reg_ymm = $08000000;
- { Bits 16..19: subclasses, meaning depends on classes field }
- otf_sub0 = $00010000;
- otf_sub1 = $00020000;
- otf_sub2 = $00040000;
- otf_sub3 = $00080000;
- OT_REG_SMASK = otf_sub0 or otf_sub1 or otf_sub2 or otf_sub3;
- OT_REG_TYPMASK = otf_reg_cdt or otf_reg_gpr or otf_reg_sreg or otf_reg_fpu or otf_reg_mmx or otf_reg_xmm or otf_reg_ymm;
- { register class 0: CRx, DRx and TRx }
- {$ifdef x86_64}
- OT_REG_CDT = OT_REGISTER or otf_reg_cdt or OT_BITS64;
- {$else x86_64}
- OT_REG_CDT = OT_REGISTER or otf_reg_cdt or OT_BITS32;
- {$endif x86_64}
- OT_REG_CREG = OT_REG_CDT or otf_sub0; { CRn }
- OT_REG_DREG = OT_REG_CDT or otf_sub1; { DRn }
- OT_REG_TREG = OT_REG_CDT or otf_sub2; { TRn }
- OT_REG_CR4 = OT_REG_CDT or otf_sub3; { CR4 (Pentium only) }
- { register class 1: general-purpose registers }
- OT_REG_GPR = OT_REGNORM or otf_reg_gpr;
- OT_RM_GPR = OT_REGMEM or otf_reg_gpr;
- OT_REG8 = OT_REG_GPR or OT_BITS8; { 8-bit GPR }
- OT_REG16 = OT_REG_GPR or OT_BITS16;
- OT_REG32 = OT_REG_GPR or OT_BITS32;
- OT_REG64 = OT_REG_GPR or OT_BITS64;
- { GPR subclass 0: accumulator: AL, AX, EAX or RAX }
- OT_REG_ACCUM = OT_REG_GPR or otf_sub0;
- OT_REG_AL = OT_REG_ACCUM or OT_BITS8;
- OT_REG_AX = OT_REG_ACCUM or OT_BITS16;
- OT_REG_EAX = OT_REG_ACCUM or OT_BITS32;
- {$ifdef x86_64}
- OT_REG_RAX = OT_REG_ACCUM or OT_BITS64;
- {$endif x86_64}
- { GPR subclass 1: counter: CL, CX, ECX or RCX }
- OT_REG_COUNT = OT_REG_GPR or otf_sub1;
- OT_REG_CL = OT_REG_COUNT or OT_BITS8;
- OT_REG_CX = OT_REG_COUNT or OT_BITS16;
- OT_REG_ECX = OT_REG_COUNT or OT_BITS32;
- {$ifdef x86_64}
- OT_REG_RCX = OT_REG_COUNT or OT_BITS64;
- {$endif x86_64}
- { GPR subclass 2: data register: DL, DX, EDX or RDX }
- OT_REG_DX = OT_REG_GPR or otf_sub2 or OT_BITS16;
- OT_REG_EDX = OT_REG_GPR or otf_sub2 or OT_BITS32;
- { register class 2: Segment registers }
- OT_REG_SREG = OT_REGISTER or otf_reg_sreg or OT_BITS16;
- OT_REG_CS = OT_REG_SREG or otf_sub0; { CS }
- OT_REG_DESS = OT_REG_SREG or otf_sub1; { DS, ES, SS (non-CS 86 registers) }
- OT_REG_FSGS = OT_REG_SREG or otf_sub2; { FS, GS (386 extended registers) }
- { register class 3: FPU registers }
- OT_FPUREG = OT_REGISTER or otf_reg_fpu;
- OT_FPU0 = OT_FPUREG or otf_sub0; { FPU stack register zero }
- { register class 4: MMX (both reg and r/m) }
- OT_MMXREG = OT_REGNORM or otf_reg_mmx;
- OT_MMXRM = OT_REGMEM or otf_reg_mmx;
- { register class 5: XMM (both reg and r/m) }
- OT_XMMREG = OT_REGNORM or otf_reg_xmm;
- OT_XMMRM = OT_REGMEM or otf_reg_xmm;
- OT_XMEM32 = OT_REGNORM or otf_reg_xmm or otf_reg_gpr or OT_BITS32;
- OT_XMEM64 = OT_REGNORM or otf_reg_xmm or otf_reg_gpr or OT_BITS64;
- { register class 5: XMM (both reg and r/m) }
- OT_YMMREG = OT_REGNORM or otf_reg_ymm;
- OT_YMMRM = OT_REGMEM or otf_reg_ymm;
- OT_YMEM32 = OT_REGNORM or otf_reg_ymm or otf_reg_gpr or OT_BITS32;
- OT_YMEM64 = OT_REGNORM or otf_reg_ymm or otf_reg_gpr or OT_BITS64;
- { Vector-Memory operands }
- OT_VMEM_ANY = OT_XMEM32 or OT_XMEM64 or OT_YMEM32 or OT_YMEM64;
- { Memory operands }
- OT_MEM8 = OT_MEMORY or OT_BITS8;
- OT_MEM16 = OT_MEMORY or OT_BITS16;
- OT_MEM32 = OT_MEMORY or OT_BITS32;
- OT_MEM64 = OT_MEMORY or OT_BITS64;
- OT_MEM128 = OT_MEMORY or OT_BITS128;
- OT_MEM256 = OT_MEMORY or OT_BITS256;
- OT_MEM80 = OT_MEMORY or OT_BITS80;
- OT_MEM_OFFS = OT_MEMORY or otf_sub0; { special type of EA }
- { simple [address] offset }
- { Matches any type of r/m operand }
- OT_MEMORY_ANY = OT_MEMORY or OT_RM_GPR or OT_XMMRM or OT_MMXRM or OT_YMMRM;
- { Immediate operands }
- OT_IMM8 = OT_IMMEDIATE or OT_BITS8;
- OT_IMM16 = OT_IMMEDIATE or OT_BITS16;
- OT_IMM32 = OT_IMMEDIATE or OT_BITS32;
- OT_IMM64 = OT_IMMEDIATE or OT_BITS64;
- OT_ONENESS = otf_sub0; { special type of immediate operand }
- OT_UNITY = OT_IMMEDIATE or OT_ONENESS; { for shift/rotate instructions }
- { Size of the instruction table converted by nasmconv.pas }
- {$if defined(x86_64)}
- instabentries = {$i x8664nop.inc}
- {$elseif defined(i386)}
- instabentries = {$i i386nop.inc}
- {$elseif defined(i8086)}
- instabentries = {$i i8086nop.inc}
- {$endif}
- maxinfolen = 8;
- MaxInsChanges = 3; { Max things a instruction can change }
- type
- { What an instruction can change. Needed for optimizer and spilling code.
- Note: The order of this enumeration is should not be changed! }
- TInsChange = (Ch_None,
- {Read from a register}
- Ch_REAX, Ch_RECX, Ch_REDX, Ch_REBX, Ch_RESP, Ch_REBP, Ch_RESI, Ch_REDI,
- {write from a register}
- Ch_WEAX, Ch_WECX, Ch_WEDX, Ch_WEBX, Ch_WESP, Ch_WEBP, Ch_WESI, Ch_WEDI,
- {read and write from/to a register}
- Ch_RWEAX, Ch_RWECX, Ch_RWEDX, Ch_RWEBX, Ch_RWESP, Ch_RWEBP, Ch_RWESI, Ch_RWEDI,
- {modify the contents of a register with the purpose of using
- this changed content afterwards (add/sub/..., but e.g. not rep
- or movsd)}
- Ch_MEAX, Ch_MECX, Ch_MEDX, Ch_MEBX, Ch_MESP, Ch_MEBP, Ch_MESI, Ch_MEDI,
- Ch_CDirFlag {clear direction flag}, Ch_SDirFlag {set dir flag},
- Ch_RFlags, Ch_WFlags, Ch_RWFlags, Ch_FPU,
- Ch_Rop1, Ch_Wop1, Ch_RWop1,Ch_Mop1,
- Ch_Rop2, Ch_Wop2, Ch_RWop2,Ch_Mop2,
- Ch_Rop3, Ch_WOp3, Ch_RWOp3,Ch_Mop3,
- Ch_WMemEDI,
- Ch_All,
- { x86_64 registers }
- Ch_RRAX, Ch_RRCX, Ch_RRDX, Ch_RRBX, Ch_RRSP, Ch_RRBP, Ch_RRSI, Ch_RRDI,
- Ch_WRAX, Ch_WRCX, Ch_WRDX, Ch_WRBX, Ch_WRSP, Ch_WRBP, Ch_WRSI, Ch_WRDI,
- Ch_RWRAX, Ch_RWRCX, Ch_RWRDX, Ch_RWRBX, Ch_RWRSP, Ch_RWRBP, Ch_RWRSI, Ch_RWRDI,
- Ch_MRAX, Ch_MRCX, Ch_MRDX, Ch_MRBX, Ch_MRSP, Ch_MRBP, Ch_MRSI, Ch_MRDI
- );
- TInsProp = packed record
- Ch : Array[1..MaxInsChanges] of TInsChange;
- end;
- TMemRefSizeInfo = (msiUnkown, msiUnsupported, msiNoSize,
- msiMultiple, msiMultiple8, msiMultiple16, msiMultiple32,
- msiMultiple64, msiMultiple128, msiMultiple256,
- msiMemRegSize, msiMemRegx16y32, msiMemRegx32y64, msiMemRegx64y128, msiMemRegx64y256,
- msiMem8, msiMem16, msiMem32, msiMem64, msiMem128, msiMem256,
- msiXMem32, msiXMem64, msiYMem32, msiYMem64,
- msiVMemMultiple, msiVMemRegSize);
- TConstSizeInfo = (csiUnkown, csiMultiple, csiNoSize, csiMem8, csiMem16, csiMem32, csiMem64);
- TInsTabMemRefSizeInfoRec = record
- MemRefSize : TMemRefSizeInfo;
- ExistsSSEAVX: boolean;
- ConstSize : TConstSizeInfo;
- end;
- const
- MemRefMultiples: set of TMemRefSizeInfo = [msiMultiple, msiMultiple8,
- msiMultiple16, msiMultiple32,
- msiMultiple64, msiMultiple128,
- msiMultiple256, msiVMemMultiple];
- MemRefSizeInfoVMems: Set of TMemRefSizeInfo = [msiXMem32, msiXMem64, msiYMem32, msiYMem64,
- msiVMemMultiple, msiVMemRegSize];
- InsProp : array[tasmop] of TInsProp =
- {$if defined(x86_64)}
- {$i x8664pro.inc}
- {$elseif defined(i386)}
- {$i i386prop.inc}
- {$elseif defined(i8086)}
- {$i i8086prop.inc}
- {$endif}
- type
- TOperandOrder = (op_intel,op_att);
- tinsentry=packed record
- opcode : tasmop;
- ops : byte;
- optypes : array[0..max_operands-1] of longint;
- code : array[0..maxinfolen] of char;
- flags : int64;
- end;
- pinsentry=^tinsentry;
- { alignment for operator }
- tai_align = class(tai_align_abstract)
- reg : tregister;
- constructor create(b:byte);override;
- constructor create_op(b: byte; _op: byte);override;
- function calculatefillbuf(var buf : tfillbuffer;executable : boolean):pchar;override;
- end;
- taicpu = class(tai_cpu_abstract_sym)
- opsize : topsize;
- constructor op_none(op : tasmop);
- constructor op_none(op : tasmop;_size : topsize);
- constructor op_reg(op : tasmop;_size : topsize;_op1 : tregister);
- constructor op_const(op : tasmop;_size : topsize;_op1 : aint);
- constructor op_ref(op : tasmop;_size : topsize;const _op1 : treference);
- constructor op_reg_reg(op : tasmop;_size : topsize;_op1,_op2 : tregister);
- constructor op_reg_ref(op : tasmop;_size : topsize;_op1 : tregister;const _op2 : treference);
- constructor op_reg_const(op:tasmop; _size: topsize; _op1: tregister; _op2: aint);
- constructor op_const_reg(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister);
- constructor op_const_const(op : tasmop;_size : topsize;_op1,_op2 : aint);
- constructor op_const_ref(op : tasmop;_size : topsize;_op1 : aint;const _op2 : treference);
- constructor op_ref_reg(op : tasmop;_size : topsize;const _op1 : treference;_op2 : tregister);
- constructor op_reg_reg_reg(op : tasmop;_size : topsize;_op1,_op2,_op3 : tregister);
- constructor op_const_reg_reg(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister;_op3 : tregister);
- constructor op_const_ref_reg(op : tasmop;_size : topsize;_op1 : aint;const _op2 : treference;_op3 : tregister);
- constructor op_ref_reg_reg(op : tasmop;_size : topsize;const _op1 : treference;_op2,_op3 : tregister);
- constructor op_const_reg_ref(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister;const _op3 : treference);
- { this is for Jmp instructions }
- constructor op_cond_sym(op : tasmop;cond:TAsmCond;_size : topsize;_op1 : tasmsymbol);
- constructor op_sym(op : tasmop;_size : topsize;_op1 : tasmsymbol);
- constructor op_sym_ofs(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint);
- constructor op_sym_ofs_reg(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint;_op2 : tregister);
- constructor op_sym_ofs_ref(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint;const _op2 : treference);
- procedure changeopsize(siz:topsize);
- function GetString:string;
- { This is a workaround for the GAS non commutative fpu instruction braindamage.
- Early versions of the UnixWare assembler had a bug where some fpu instructions
- were reversed and GAS still keeps this "feature" for compatibility.
- for details: http://sourceware.org/binutils/docs/as/i386_002dBugs.html#i386_002dBugs
- http://bugs.debian.org/cgi-bin/bugreport.cgi?bug=372528
- http://en.wikibooks.org/wiki/X86_Assembly/GAS_Syntax#Caveats
- Since FPC is "GAS centric" due to its history it generates instructions with the same operand order so
- when generating output for other assemblers, the opcodes must be fixed before writing them.
- This function returns the fixed opcodes. Changing the opcodes permanently is no good idea
- because in case of smartlinking assembler is generated twice so at the second run wrong
- assembler is generated.
- }
- function FixNonCommutativeOpcodes: tasmop;
- private
- FOperandOrder : TOperandOrder;
- procedure init(_size : topsize); { this need to be called by all constructor }
- public
- { the next will reset all instructions that can change in pass 2 }
- procedure ResetPass1;override;
- procedure ResetPass2;override;
- function CheckIfValid:boolean;
- function Pass1(objdata:TObjData):longint;override;
- procedure Pass2(objdata:TObjData);override;
- procedure SetOperandOrder(order:TOperandOrder);
- function is_same_reg_move(regtype: Tregistertype):boolean;override;
- { register spilling code }
- function spilling_get_operation_type(opnr: longint): topertype;override;
- private
- { next fields are filled in pass1, so pass2 is faster }
- insentry : PInsEntry;
- insoffset : longint;
- LastInsOffset : longint; { need to be public to be reset }
- inssize : shortint;
- {$ifdef x86_64}
- rex : byte;
- {$endif x86_64}
- function InsEnd:longint;
- procedure create_ot(objdata:TObjData);
- function Matches(p:PInsEntry):boolean;
- function calcsize(p:PInsEntry):shortint;
- procedure gencode(objdata:TObjData);
- function NeedAddrPrefix(opidx:byte):boolean;
- procedure Swapoperands;
- function FindInsentry(objdata:TObjData):boolean;
- end;
- function spilling_create_load(const ref:treference;r:tregister):Taicpu;
- function spilling_create_store(r:tregister; const ref:treference):Taicpu;
- function MemRefInfo(aAsmop: TAsmOp): TInsTabMemRefSizeInfoRec;
- procedure InitAsm;
- procedure DoneAsm;
- implementation
- uses
- cutils,
- globals,
- systems,
- procinfo,
- itcpugas,
- symsym,
- cpuinfo;
- {*****************************************************************************
- Instruction table
- *****************************************************************************}
- const
- {Instruction flags }
- IF_NONE = $00000000;
- IF_SM = $00000001; { size match first two operands }
- IF_SM2 = $00000002;
- IF_SB = $00000004; { unsized operands can't be non-byte }
- IF_SW = $00000008; { unsized operands can't be non-word }
- IF_SD = $00000010; { unsized operands can't be nondword }
- IF_SMASK = $0000001f;
- IF_AR0 = $00000020; { SB, SW, SD applies to argument 0 }
- IF_AR1 = $00000040; { SB, SW, SD applies to argument 1 }
- IF_AR2 = $00000060; { SB, SW, SD applies to argument 2 }
- IF_ARMASK = $00000060; { mask for unsized argument spec }
- IF_ARSHIFT = 5; { LSB of IF_ARMASK }
- IF_PRIV = $00000100; { it's a privileged instruction }
- IF_SMM = $00000200; { it's only valid in SMM }
- IF_PROT = $00000400; { it's protected mode only }
- IF_NOX86_64 = $00000800; { removed instruction in x86_64 }
- IF_UNDOC = $00001000; { it's an undocumented instruction }
- IF_FPU = $00002000; { it's an FPU instruction }
- IF_MMX = $00004000; { it's an MMX instruction }
- { it's a 3DNow! instruction }
- IF_3DNOW = $00008000;
- { it's a SSE (KNI, MMX2) instruction }
- IF_SSE = $00010000;
- { SSE2 instructions }
- IF_SSE2 = $00020000;
- { SSE3 instructions }
- IF_SSE3 = $00040000;
- { SSE64 instructions }
- IF_SSE64 = $00080000;
- { the mask for processor types }
- {IF_PMASK = longint($FF000000);}
- { the mask for disassembly "prefer" }
- {IF_PFMASK = longint($F001FF00);}
- { SVM instructions }
- IF_SVM = $00100000;
- { SSE4 instructions }
- IF_SSE4 = $00200000;
- { TODO: These flags were added to make x86ins.dat more readable.
- Values must be reassigned to make any other use of them. }
- IF_SSSE3 = $00200000;
- IF_SSE41 = $00200000;
- IF_SSE42 = $00200000;
- IF_AVX = $00200000;
- IF_AVX2 = $00200000;
- IF_BMI1 = $00200000;
- IF_BMI2 = $00200000;
- IF_16BITONLY = $00200000;
- IF_FMA = $00200000;
- IF_FMA4 = $00200000;
- IF_PLEVEL = $0F000000; { mask for processor level }
- IF_8086 = $00000000; { 8086 instruction }
- IF_186 = $01000000; { 186+ instruction }
- IF_286 = $02000000; { 286+ instruction }
- IF_386 = $03000000; { 386+ instruction }
- IF_486 = $04000000; { 486+ instruction }
- IF_PENT = $05000000; { Pentium instruction }
- IF_P6 = $06000000; { P6 instruction }
- IF_KATMAI = $07000000; { Katmai instructions }
- IF_WILLAMETTE = $08000000; { Willamette instructions }
- IF_PRESCOTT = $09000000; { Prescott instructions }
- IF_X86_64 = $0a000000;
- IF_CYRIX = $0b000000; { Cyrix-specific instruction }
- IF_AMD = $0c000000; { AMD-specific instruction }
- IF_CENTAUR = $0d000000; { centaur-specific instruction }
- IF_SANDYBRIDGE = $0e000000; { Sandybridge-specific instruction }
- IF_NEC = $0f000000; { NEC V20/V30 instruction }
- { added flags }
- IF_PRE = $40000000; { it's a prefix instruction }
- IF_PASS2 = $80000000; { if the instruction can change in a second pass }
- type
- TInsTabCache=array[TasmOp] of longint;
- PInsTabCache=^TInsTabCache;
- TInsTabMemRefSizeInfoCache=array[TasmOp] of TInsTabMemRefSizeInfoRec;
- PInsTabMemRefSizeInfoCache=^TInsTabMemRefSizeInfoCache;
- const
- {$if defined(x86_64)}
- InsTab:array[0..instabentries-1] of TInsEntry={$i x8664tab.inc}
- {$elseif defined(i386)}
- InsTab:array[0..instabentries-1] of TInsEntry={$i i386tab.inc}
- {$elseif defined(i8086)}
- InsTab:array[0..instabentries-1] of TInsEntry={$i i8086tab.inc}
- {$endif}
- var
- InsTabCache : PInsTabCache;
- InsTabMemRefSizeInfoCache: PInsTabMemRefSizeInfoCache;
- const
- {$if defined(x86_64)}
- { Intel style operands ! }
- opsize_2_type:array[0..2,topsize] of longint=(
- (OT_NONE,
- OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS16,OT_BITS32,OT_BITS32,OT_BITS64,OT_BITS64,OT_BITS64,
- OT_BITS16,OT_BITS32,OT_BITS64,
- OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,
- OT_BITS64,
- OT_NEAR,OT_FAR,OT_SHORT,
- OT_NONE,
- OT_BITS128,
- OT_BITS256
- ),
- (OT_NONE,
- OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS8,OT_BITS8,OT_BITS16,OT_BITS8,OT_BITS16,OT_BITS32,
- OT_BITS16,OT_BITS32,OT_BITS64,
- OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,
- OT_BITS64,
- OT_NEAR,OT_FAR,OT_SHORT,
- OT_NONE,
- OT_BITS128,
- OT_BITS256
- ),
- (OT_NONE,
- OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_NONE,OT_NONE,OT_NONE,OT_NONE,OT_NONE,OT_NONE,
- OT_BITS16,OT_BITS32,OT_BITS64,
- OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,
- OT_BITS64,
- OT_NEAR,OT_FAR,OT_SHORT,
- OT_NONE,
- OT_BITS128,
- OT_BITS256
- )
- );
- reg_ot_table : array[tregisterindex] of longint = (
- {$i r8664ot.inc}
- );
- {$elseif defined(i386)}
- { Intel style operands ! }
- opsize_2_type:array[0..2,topsize] of longint=(
- (OT_NONE,
- OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS16,OT_BITS32,OT_BITS32,
- OT_BITS16,OT_BITS32,OT_BITS64,
- OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,
- OT_BITS64,
- OT_NEAR,OT_FAR,OT_SHORT,
- OT_NONE,
- OT_BITS128,
- OT_BITS256
- ),
- (OT_NONE,
- OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS8,OT_BITS8,OT_BITS16,
- OT_BITS16,OT_BITS32,OT_BITS64,
- OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,
- OT_BITS64,
- OT_NEAR,OT_FAR,OT_SHORT,
- OT_NONE,
- OT_BITS128,
- OT_BITS256
- ),
- (OT_NONE,
- OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_NONE,OT_NONE,OT_NONE,
- OT_BITS16,OT_BITS32,OT_BITS64,
- OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,
- OT_BITS64,
- OT_NEAR,OT_FAR,OT_SHORT,
- OT_NONE,
- OT_BITS128,
- OT_BITS256
- )
- );
- reg_ot_table : array[tregisterindex] of longint = (
- {$i r386ot.inc}
- );
- {$elseif defined(i8086)}
- { Intel style operands ! }
- opsize_2_type:array[0..2,topsize] of longint=(
- (OT_NONE,
- OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS16,OT_BITS32,OT_BITS32,
- OT_BITS16,OT_BITS32,OT_BITS64,
- OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,
- OT_BITS64,
- OT_NEAR,OT_FAR,OT_SHORT,
- OT_NONE,
- OT_BITS128,
- OT_BITS256
- ),
- (OT_NONE,
- OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS8,OT_BITS8,OT_BITS16,
- OT_BITS16,OT_BITS32,OT_BITS64,
- OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,
- OT_BITS64,
- OT_NEAR,OT_FAR,OT_SHORT,
- OT_NONE,
- OT_BITS128,
- OT_BITS256
- ),
- (OT_NONE,
- OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_NONE,OT_NONE,OT_NONE,
- OT_BITS16,OT_BITS32,OT_BITS64,
- OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,
- OT_BITS64,
- OT_NEAR,OT_FAR,OT_SHORT,
- OT_NONE,
- OT_BITS128,
- OT_BITS256
- )
- );
- reg_ot_table : array[tregisterindex] of longint = (
- {$i r8086ot.inc}
- );
- {$endif}
- function MemRefInfo(aAsmop: TAsmOp): TInsTabMemRefSizeInfoRec;
- begin
- result := InsTabMemRefSizeInfoCache^[aAsmop];
- end;
- { Operation type for spilling code }
- type
- toperation_type_table=array[tasmop,0..Max_Operands] of topertype;
- var
- operation_type_table : ^toperation_type_table;
- {****************************************************************************
- TAI_ALIGN
- ****************************************************************************}
- constructor tai_align.create(b: byte);
- begin
- inherited create(b);
- reg:=NR_ECX;
- end;
- constructor tai_align.create_op(b: byte; _op: byte);
- begin
- inherited create_op(b,_op);
- reg:=NR_NO;
- end;
- function tai_align.calculatefillbuf(var buf : tfillbuffer;executable : boolean):pchar;
- const
- { Updated according to
- Software Optimization Guide for AMD Family 15h Processors, Verison 3.08, January 2014
- and
- Intel 64 and IA-32 Architectures Software Developer’s Manual
- Volume 2B: Instruction Set Reference, N-Z, January 2015
- }
- alignarray_cmovcpus:array[0..10] of string[11]=(
- #$66#$66#$66#$0F#$1F#$84#$00#$00#$00#$00#$00,
- #$66#$66#$0F#$1F#$84#$00#$00#$00#$00#$00,
- #$66#$0F#$1F#$84#$00#$00#$00#$00#$00,
- #$0F#$1F#$84#$00#$00#$00#$00#$00,
- #$0F#$1F#$80#$00#$00#$00#$00,
- #$66#$0F#$1F#$44#$00#$00,
- #$0F#$1F#$44#$00#$00,
- #$0F#$1F#$40#$00,
- #$0F#$1F#$00,
- #$66#$90,
- #$90);
- alignarray:array[0..5] of string[8]=(
- #$8D#$B4#$26#$00#$00#$00#$00,
- #$8D#$B6#$00#$00#$00#$00,
- #$8D#$74#$26#$00,
- #$8D#$76#$00,
- #$89#$F6,
- #$90);
- var
- bufptr : pchar;
- j : longint;
- localsize: byte;
- begin
- inherited calculatefillbuf(buf,executable);
- if not(use_op) and executable then
- begin
- bufptr:=pchar(@buf);
- { fillsize may still be used afterwards, so don't modify }
- { e.g. writebytes(hp.calculatefillbuf(buf)^,hp.fillsize) }
- localsize:=fillsize;
- while (localsize>0) do
- begin
- {$ifndef i8086}
- if CPUX86_HAS_CMOV in cpu_capabilities[current_settings.cputype] then
- begin
- for j:=low(alignarray_cmovcpus) to high(alignarray_cmovcpus) do
- if (localsize>=length(alignarray_cmovcpus[j])) then
- break;
- move(alignarray_cmovcpus[j][1],bufptr^,length(alignarray_cmovcpus[j]));
- inc(bufptr,length(alignarray_cmovcpus[j]));
- dec(localsize,length(alignarray_cmovcpus[j]));
- end
- else
- {$endif not i8086}
- begin
- for j:=low(alignarray) to high(alignarray) do
- if (localsize>=length(alignarray[j])) then
- break;
- move(alignarray[j][1],bufptr^,length(alignarray[j]));
- inc(bufptr,length(alignarray[j]));
- dec(localsize,length(alignarray[j]));
- end
- end;
- end;
- calculatefillbuf:=pchar(@buf);
- end;
- {*****************************************************************************
- Taicpu Constructors
- *****************************************************************************}
- procedure taicpu.changeopsize(siz:topsize);
- begin
- opsize:=siz;
- end;
- procedure taicpu.init(_size : topsize);
- begin
- { default order is att }
- FOperandOrder:=op_att;
- segprefix:=NR_NO;
- opsize:=_size;
- insentry:=nil;
- LastInsOffset:=-1;
- InsOffset:=0;
- InsSize:=0;
- end;
- constructor taicpu.op_none(op : tasmop);
- begin
- inherited create(op);
- init(S_NO);
- end;
- constructor taicpu.op_none(op : tasmop;_size : topsize);
- begin
- inherited create(op);
- init(_size);
- end;
- constructor taicpu.op_reg(op : tasmop;_size : topsize;_op1 : tregister);
- begin
- inherited create(op);
- init(_size);
- ops:=1;
- loadreg(0,_op1);
- end;
- constructor taicpu.op_const(op : tasmop;_size : topsize;_op1 : aint);
- begin
- inherited create(op);
- init(_size);
- ops:=1;
- loadconst(0,_op1);
- end;
- constructor taicpu.op_ref(op : tasmop;_size : topsize;const _op1 : treference);
- begin
- inherited create(op);
- init(_size);
- ops:=1;
- loadref(0,_op1);
- end;
- constructor taicpu.op_reg_reg(op : tasmop;_size : topsize;_op1,_op2 : tregister);
- begin
- inherited create(op);
- init(_size);
- ops:=2;
- loadreg(0,_op1);
- loadreg(1,_op2);
- end;
- constructor taicpu.op_reg_const(op:tasmop; _size: topsize; _op1: tregister; _op2: aint);
- begin
- inherited create(op);
- init(_size);
- ops:=2;
- loadreg(0,_op1);
- loadconst(1,_op2);
- end;
- constructor taicpu.op_reg_ref(op : tasmop;_size : topsize;_op1 : tregister;const _op2 : treference);
- begin
- inherited create(op);
- init(_size);
- ops:=2;
- loadreg(0,_op1);
- loadref(1,_op2);
- end;
- constructor taicpu.op_const_reg(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister);
- begin
- inherited create(op);
- init(_size);
- ops:=2;
- loadconst(0,_op1);
- loadreg(1,_op2);
- end;
- constructor taicpu.op_const_const(op : tasmop;_size : topsize;_op1,_op2 : aint);
- begin
- inherited create(op);
- init(_size);
- ops:=2;
- loadconst(0,_op1);
- loadconst(1,_op2);
- end;
- constructor taicpu.op_const_ref(op : tasmop;_size : topsize;_op1 : aint;const _op2 : treference);
- begin
- inherited create(op);
- init(_size);
- ops:=2;
- loadconst(0,_op1);
- loadref(1,_op2);
- end;
- constructor taicpu.op_ref_reg(op : tasmop;_size : topsize;const _op1 : treference;_op2 : tregister);
- begin
- inherited create(op);
- init(_size);
- ops:=2;
- loadref(0,_op1);
- loadreg(1,_op2);
- end;
- constructor taicpu.op_reg_reg_reg(op : tasmop;_size : topsize;_op1,_op2,_op3 : tregister);
- begin
- inherited create(op);
- init(_size);
- ops:=3;
- loadreg(0,_op1);
- loadreg(1,_op2);
- loadreg(2,_op3);
- end;
- constructor taicpu.op_const_reg_reg(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister;_op3 : tregister);
- begin
- inherited create(op);
- init(_size);
- ops:=3;
- loadconst(0,_op1);
- loadreg(1,_op2);
- loadreg(2,_op3);
- end;
- constructor taicpu.op_ref_reg_reg(op : tasmop;_size : topsize;const _op1 : treference;_op2,_op3 : tregister);
- begin
- inherited create(op);
- init(_size);
- ops:=3;
- loadref(0,_op1);
- loadreg(1,_op2);
- loadreg(2,_op3);
- end;
- constructor taicpu.op_const_ref_reg(op : tasmop;_size : topsize;_op1 : aint;const _op2 : treference;_op3 : tregister);
- begin
- inherited create(op);
- init(_size);
- ops:=3;
- loadconst(0,_op1);
- loadref(1,_op2);
- loadreg(2,_op3);
- end;
- constructor taicpu.op_const_reg_ref(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister;const _op3 : treference);
- begin
- inherited create(op);
- init(_size);
- ops:=3;
- loadconst(0,_op1);
- loadreg(1,_op2);
- loadref(2,_op3);
- end;
- constructor taicpu.op_cond_sym(op : tasmop;cond:TAsmCond;_size : topsize;_op1 : tasmsymbol);
- begin
- inherited create(op);
- init(_size);
- condition:=cond;
- ops:=1;
- loadsymbol(0,_op1,0);
- end;
- constructor taicpu.op_sym(op : tasmop;_size : topsize;_op1 : tasmsymbol);
- begin
- inherited create(op);
- init(_size);
- ops:=1;
- loadsymbol(0,_op1,0);
- end;
- constructor taicpu.op_sym_ofs(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint);
- begin
- inherited create(op);
- init(_size);
- ops:=1;
- loadsymbol(0,_op1,_op1ofs);
- end;
- constructor taicpu.op_sym_ofs_reg(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint;_op2 : tregister);
- begin
- inherited create(op);
- init(_size);
- ops:=2;
- loadsymbol(0,_op1,_op1ofs);
- loadreg(1,_op2);
- end;
- constructor taicpu.op_sym_ofs_ref(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint;const _op2 : treference);
- begin
- inherited create(op);
- init(_size);
- ops:=2;
- loadsymbol(0,_op1,_op1ofs);
- loadref(1,_op2);
- end;
- function taicpu.GetString:string;
- var
- i : longint;
- s : string;
- addsize : boolean;
- begin
- s:='['+std_op2str[opcode];
- for i:=0 to ops-1 do
- begin
- with oper[i]^ do
- begin
- if i=0 then
- s:=s+' '
- else
- s:=s+',';
- { type }
- addsize:=false;
- if (ot and OT_XMMREG)=OT_XMMREG then
- s:=s+'xmmreg'
- else
- if (ot and OT_YMMREG)=OT_YMMREG then
- s:=s+'ymmreg'
- else
- if (ot and OT_MMXREG)=OT_MMXREG then
- s:=s+'mmxreg'
- else
- if (ot and OT_FPUREG)=OT_FPUREG then
- s:=s+'fpureg'
- else
- if (ot and OT_REGISTER)=OT_REGISTER then
- begin
- s:=s+'reg';
- addsize:=true;
- end
- else
- if (ot and OT_IMMEDIATE)=OT_IMMEDIATE then
- begin
- s:=s+'imm';
- addsize:=true;
- end
- else
- if (ot and OT_MEMORY)=OT_MEMORY then
- begin
- s:=s+'mem';
- addsize:=true;
- end
- else
- s:=s+'???';
- { size }
- if addsize then
- begin
- if (ot and OT_BITS8)<>0 then
- s:=s+'8'
- else
- if (ot and OT_BITS16)<>0 then
- s:=s+'16'
- else
- if (ot and OT_BITS32)<>0 then
- s:=s+'32'
- else
- if (ot and OT_BITS64)<>0 then
- s:=s+'64'
- else
- if (ot and OT_BITS128)<>0 then
- s:=s+'128'
- else
- if (ot and OT_BITS256)<>0 then
- s:=s+'256'
- else
- s:=s+'??';
- { signed }
- if (ot and OT_SIGNED)<>0 then
- s:=s+'s';
- end;
- end;
- end;
- GetString:=s+']';
- end;
- procedure taicpu.Swapoperands;
- var
- p : POper;
- begin
- { Fix the operands which are in AT&T style and we need them in Intel style }
- case ops of
- 0,1:
- ;
- 2 : begin
- { 0,1 -> 1,0 }
- p:=oper[0];
- oper[0]:=oper[1];
- oper[1]:=p;
- end;
- 3 : begin
- { 0,1,2 -> 2,1,0 }
- p:=oper[0];
- oper[0]:=oper[2];
- oper[2]:=p;
- end;
- 4 : begin
- { 0,1,2,3 -> 3,2,1,0 }
- p:=oper[0];
- oper[0]:=oper[3];
- oper[3]:=p;
- p:=oper[1];
- oper[1]:=oper[2];
- oper[2]:=p;
- end;
- else
- internalerror(201108141);
- end;
- end;
- procedure taicpu.SetOperandOrder(order:TOperandOrder);
- begin
- if FOperandOrder<>order then
- begin
- Swapoperands;
- FOperandOrder:=order;
- end;
- end;
- function taicpu.FixNonCommutativeOpcodes: tasmop;
- begin
- result:=opcode;
- { we need ATT order }
- SetOperandOrder(op_att);
- if (
- (ops=2) and
- (oper[0]^.typ=top_reg) and
- (oper[1]^.typ=top_reg) and
- { if the first is ST and the second is also a register
- it is necessarily ST1 .. ST7 }
- ((oper[0]^.reg=NR_ST) or
- (oper[0]^.reg=NR_ST0))
- ) or
- { ((ops=1) and
- (oper[0]^.typ=top_reg) and
- (oper[0]^.reg in [R_ST1..R_ST7])) or}
- (ops=0) then
- begin
- if opcode=A_FSUBR then
- result:=A_FSUB
- else if opcode=A_FSUB then
- result:=A_FSUBR
- else if opcode=A_FDIVR then
- result:=A_FDIV
- else if opcode=A_FDIV then
- result:=A_FDIVR
- else if opcode=A_FSUBRP then
- result:=A_FSUBP
- else if opcode=A_FSUBP then
- result:=A_FSUBRP
- else if opcode=A_FDIVRP then
- result:=A_FDIVP
- else if opcode=A_FDIVP then
- result:=A_FDIVRP;
- end;
- if (
- (ops=1) and
- (oper[0]^.typ=top_reg) and
- (getregtype(oper[0]^.reg)=R_FPUREGISTER) and
- (oper[0]^.reg<>NR_ST)
- ) then
- begin
- if opcode=A_FSUBRP then
- result:=A_FSUBP
- else if opcode=A_FSUBP then
- result:=A_FSUBRP
- else if opcode=A_FDIVRP then
- result:=A_FDIVP
- else if opcode=A_FDIVP then
- result:=A_FDIVRP;
- end;
- end;
- {*****************************************************************************
- Assembler
- *****************************************************************************}
- type
- ea = packed record
- sib_present : boolean;
- bytes : byte;
- size : byte;
- modrm : byte;
- sib : byte;
- {$ifdef x86_64}
- rex : byte;
- {$endif x86_64}
- end;
- procedure taicpu.create_ot(objdata:TObjData);
- {
- this function will also fix some other fields which only needs to be once
- }
- var
- i,l,relsize : longint;
- currsym : TObjSymbol;
- begin
- if ops=0 then
- exit;
- { update oper[].ot field }
- for i:=0 to ops-1 do
- with oper[i]^ do
- begin
- case typ of
- top_reg :
- begin
- ot:=reg_ot_table[findreg_by_number(reg)];
- end;
- top_ref :
- begin
- if (ref^.refaddr=addr_no)
- {$ifdef i386}
- or (
- (ref^.refaddr in [addr_pic]) and
- { allow any base for assembler blocks }
- ((assigned(current_procinfo) and
- (pi_has_assembler_block in current_procinfo.flags) and
- (ref^.base<>NR_NO)) or (ref^.base=NR_EBX))
- )
- {$endif i386}
- {$ifdef x86_64}
- or (
- (ref^.refaddr in [addr_pic,addr_pic_no_got]) and
- (ref^.base<>NR_NO)
- )
- {$endif x86_64}
- then
- begin
- { create ot field }
- if (reg_ot_table[findreg_by_number(ref^.base)] and OT_REG_GPR = OT_REG_GPR) and
- ((reg_ot_table[findreg_by_number(ref^.index)] = OT_XMMREG) or
- (reg_ot_table[findreg_by_number(ref^.index)] = OT_YMMREG)
- ) then
- // AVX2 - vector-memory-referenz (e.g. vgatherdpd xmm0, [rax xmm1], xmm2)
- ot := (reg_ot_table[findreg_by_number(ref^.base)] and OT_REG_GPR) or
- (reg_ot_table[findreg_by_number(ref^.index)])
- else if (ref^.base = NR_NO) and
- ((reg_ot_table[findreg_by_number(ref^.index)] = OT_XMMREG) or
- (reg_ot_table[findreg_by_number(ref^.index)] = OT_YMMREG)
- ) then
- // AVX2 - vector-memory-referenz without base-register (e.g. vgatherdpd xmm0, [xmm1], xmm2)
- ot := (OT_REG_GPR) or
- (reg_ot_table[findreg_by_number(ref^.index)])
- else if (ot and OT_SIZE_MASK)=0 then
- ot:=OT_MEMORY_ANY or opsize_2_type[i,opsize]
- else
- ot:=OT_MEMORY_ANY or (ot and OT_SIZE_MASK);
- if (ref^.base=NR_NO) and (ref^.index=NR_NO) then
- ot:=ot or OT_MEM_OFFS;
- { fix scalefactor }
- if (ref^.index=NR_NO) then
- ref^.scalefactor:=0
- else
- if (ref^.scalefactor=0) then
- ref^.scalefactor:=1;
- end
- else
- begin
- { Jumps use a relative offset which can be 8bit,
- for other opcodes we always need to generate the full
- 32bit address }
- if assigned(objdata) and
- is_jmp then
- begin
- currsym:=objdata.symbolref(ref^.symbol);
- l:=ref^.offset;
- {$push}
- {$r-,q-} { disable also overflow as address returns a qword for x86_64 }
- if assigned(currsym) then
- inc(l,currsym.address);
- {$pop}
- { when it is a forward jump we need to compensate the
- offset of the instruction since the previous time,
- because the symbol address is then still using the
- 'old-style' addressing.
- For backwards jumps this is not required because the
- address of the symbol is already adjusted to the
- new offset }
- if (l>InsOffset) and (LastInsOffset<>-1) then
- inc(l,InsOffset-LastInsOffset);
- { instruction size will then always become 2 (PFV) }
- relsize:=(InsOffset+2)-l;
- if (relsize>=-128) and (relsize<=127) and
- (
- not assigned(currsym) or
- (currsym.objsection=objdata.currobjsec)
- ) then
- ot:=OT_IMM8 or OT_SHORT
- else
- ot:=OT_IMM32 or OT_NEAR;
- end
- else
- ot:=OT_IMM32 or OT_NEAR;
- end;
- end;
- top_local :
- begin
- if (ot and OT_SIZE_MASK)=0 then
- ot:=OT_MEMORY or opsize_2_type[i,opsize]
- else
- ot:=OT_MEMORY or (ot and OT_SIZE_MASK);
- end;
- top_const :
- begin
- // if opcode is a SSE or AVX-instruction then we need a
- // special handling (opsize can different from const-size)
- // (e.g. "pextrw reg/m16, xmmreg, imm8" =>> opsize (16 bit), const-size (8 bit)
- if (InsTabMemRefSizeInfoCache^[opcode].ExistsSSEAVX) and
- (not(InsTabMemRefSizeInfoCache^[opcode].ConstSize in [csiMultiple, csiUnkown])) then
- begin
- case InsTabMemRefSizeInfoCache^[opcode].ConstSize of
- csiNoSize: ot := ot and (not(OT_SIZE_MASK)) or OT_IMMEDIATE;
- csiMem8: ot := ot and (not(OT_SIZE_MASK)) or OT_IMMEDIATE or OT_BITS8;
- csiMem16: ot := ot and (not(OT_SIZE_MASK)) or OT_IMMEDIATE or OT_BITS16;
- csiMem32: ot := ot and (not(OT_SIZE_MASK)) or OT_IMMEDIATE or OT_BITS32;
- csiMem64: ot := ot and (not(OT_SIZE_MASK)) or OT_IMMEDIATE or OT_BITS64;
- end;
- end
- else
- begin
- { allow 2nd, 3rd or 4th operand being a constant and expect no size for shuf* etc. }
- { further, allow AAD and AAM with imm. operand }
- if (opsize=S_NO) and not((i in [1,2,3])
- {$ifndef x86_64}
- or ((i=0) and (opcode in [A_AAD,A_AAM]))
- {$endif x86_64}
- ) then
- message(asmr_e_invalid_opcode_and_operand);
- if (opsize<>S_W) and (aint(val)>=-128) and (val<=127) then
- ot:=OT_IMM8 or OT_SIGNED
- else
- ot:=OT_IMMEDIATE or opsize_2_type[i,opsize];
- if (val=1) and (i=1) then
- ot := ot or OT_ONENESS;
- end;
- end;
- top_none :
- begin
- { generated when there was an error in the
- assembler reader. It never happends when generating
- assembler }
- end;
- else
- internalerror(200402266);
- end;
- end;
- end;
- function taicpu.InsEnd:longint;
- begin
- InsEnd:=InsOffset+InsSize;
- end;
- function taicpu.Matches(p:PInsEntry):boolean;
- { * IF_SM stands for Size Match: any operand whose size is not
- * explicitly specified by the template is `really' intended to be
- * the same size as the first size-specified operand.
- * Non-specification is tolerated in the input instruction, but
- * _wrong_ specification is not.
- *
- * IF_SM2 invokes Size Match on only the first _two_ operands, for
- * three-operand instructions such as SHLD: it implies that the
- * first two operands must match in size, but that the third is
- * required to be _unspecified_.
- *
- * IF_SB invokes Size Byte: operands with unspecified size in the
- * template are really bytes, and so no non-byte specification in
- * the input instruction will be tolerated. IF_SW similarly invokes
- * Size Word, and IF_SD invokes Size Doubleword.
- *
- * (The default state if neither IF_SM nor IF_SM2 is specified is
- * that any operand with unspecified size in the template is
- * required to have unspecified size in the instruction too...)
- }
- var
- insot,
- currot,
- i,j,asize,oprs : longint;
- insflags:cardinal;
- siz : array[0..max_operands-1] of longint;
- begin
- result:=false;
- { Check the opcode and operands }
- if (p^.opcode<>opcode) or (p^.ops<>ops) then
- exit;
- for i:=0 to p^.ops-1 do
- begin
- insot:=p^.optypes[i];
- currot:=oper[i]^.ot;
- { Check the operand flags }
- if (insot and (not currot) and OT_NON_SIZE)<>0 then
- exit;
- { Check if the passed operand size matches with one of
- the supported operand sizes }
- if ((insot and OT_SIZE_MASK)<>0) and
- ((insot and currot and OT_SIZE_MASK)<>(currot and OT_SIZE_MASK)) then
- exit;
- end;
- { Check operand sizes }
- insflags:=p^.flags;
- if insflags and IF_SMASK<>0 then
- begin
- { as default an untyped size can get all the sizes, this is different
- from nasm, but else we need to do a lot checking which opcodes want
- size or not with the automatic size generation }
- asize:=-1;
- if (insflags and IF_SB)<>0 then
- asize:=OT_BITS8
- else if (insflags and IF_SW)<>0 then
- asize:=OT_BITS16
- else if (insflags and IF_SD)<>0 then
- asize:=OT_BITS32;
- if (insflags and IF_ARMASK)<>0 then
- begin
- siz[0]:=-1;
- siz[1]:=-1;
- siz[2]:=-1;
- siz[((insflags and IF_ARMASK) shr IF_ARSHIFT)-1]:=asize;
- end
- else
- begin
- siz[0]:=asize;
- siz[1]:=asize;
- siz[2]:=asize;
- end;
- if (insflags and (IF_SM or IF_SM2))<>0 then
- begin
- if (insflags and IF_SM2)<>0 then
- oprs:=2
- else
- oprs:=p^.ops;
- for i:=0 to oprs-1 do
- if ((p^.optypes[i] and OT_SIZE_MASK) <> 0) then
- begin
- for j:=0 to oprs-1 do
- siz[j]:=p^.optypes[i] and OT_SIZE_MASK;
- break;
- end;
- end
- else
- oprs:=2;
- { Check operand sizes }
- for i:=0 to p^.ops-1 do
- begin
- insot:=p^.optypes[i];
- currot:=oper[i]^.ot;
- if ((insot and OT_SIZE_MASK)=0) and
- ((currot and OT_SIZE_MASK and (not siz[i]))<>0) and
- { Immediates can always include smaller size }
- ((currot and OT_IMMEDIATE)=0) and
- (((insot and OT_SIZE_MASK) or siz[i])<(currot and OT_SIZE_MASK)) then
- exit;
- end;
- end;
- if (InsTabMemRefSizeInfoCache^[opcode].MemRefSize in MemRefMultiples) and
- (InsTabMemRefSizeInfoCache^[opcode].ExistsSSEAVX) then
- begin
- for i:=0 to p^.ops-1 do
- begin
- insot:=p^.optypes[i];
- if ((insot and OT_XMMRM) = OT_XMMRM) OR
- ((insot and OT_YMMRM) = OT_YMMRM) then
- begin
- if (insot and OT_SIZE_MASK) = 0 then
- begin
- case insot and (OT_XMMRM or OT_YMMRM) of
- OT_XMMRM: insot := insot or OT_BITS128;
- OT_YMMRM: insot := insot or OT_BITS256;
- end;
- end;
- end;
- currot:=oper[i]^.ot;
- { Check the operand flags }
- if (insot and (not currot) and OT_NON_SIZE)<>0 then
- exit;
- { Check if the passed operand size matches with one of
- the supported operand sizes }
- if ((insot and OT_SIZE_MASK)<>0) and
- ((insot and currot and OT_SIZE_MASK)<>(currot and OT_SIZE_MASK)) then
- exit;
- end;
- end;
- result:=true;
- end;
- procedure taicpu.ResetPass1;
- begin
- { we need to reset everything here, because the choosen insentry
- can be invalid for a new situation where the previously optimized
- insentry is not correct }
- InsEntry:=nil;
- InsSize:=0;
- LastInsOffset:=-1;
- end;
- procedure taicpu.ResetPass2;
- begin
- { we are here in a second pass, check if the instruction can be optimized }
- if assigned(InsEntry) and
- ((InsEntry^.flags and IF_PASS2)<>0) then
- begin
- InsEntry:=nil;
- InsSize:=0;
- end;
- LastInsOffset:=-1;
- end;
- function taicpu.CheckIfValid:boolean;
- begin
- result:=FindInsEntry(nil);
- end;
- function taicpu.FindInsentry(objdata:TObjData):boolean;
- var
- i : longint;
- begin
- result:=false;
- { Things which may only be done once, not when a second pass is done to
- optimize }
- if (Insentry=nil) or ((InsEntry^.flags and IF_PASS2)<>0) then
- begin
- current_filepos:=fileinfo;
- { We need intel style operands }
- SetOperandOrder(op_intel);
- { create the .ot fields }
- create_ot(objdata);
- { set the file postion }
- end
- else
- begin
- { we've already an insentry so it's valid }
- result:=true;
- exit;
- end;
- { Lookup opcode in the table }
- InsSize:=-1;
- i:=instabcache^[opcode];
- if i=-1 then
- begin
- Message1(asmw_e_opcode_not_in_table,gas_op2str[opcode]);
- exit;
- end;
- insentry:=@instab[i];
- while (insentry^.opcode=opcode) do
- begin
- if matches(insentry) then
- begin
- result:=true;
- exit;
- end;
- inc(insentry);
- end;
- Message1(asmw_e_invalid_opcode_and_operands,GetString);
- { No instruction found, set insentry to nil and inssize to -1 }
- insentry:=nil;
- inssize:=-1;
- end;
- function taicpu.Pass1(objdata:TObjData):longint;
- begin
- Pass1:=0;
- { Save the old offset and set the new offset }
- InsOffset:=ObjData.CurrObjSec.Size;
- { Error? }
- if (Insentry=nil) and (InsSize=-1) then
- exit;
- { set the file postion }
- current_filepos:=fileinfo;
- { Get InsEntry }
- if FindInsEntry(ObjData) then
- begin
- { Calculate instruction size }
- InsSize:=calcsize(insentry);
- if segprefix<>NR_NO then
- inc(InsSize);
- { Fix opsize if size if forced }
- if (insentry^.flags and (IF_SB or IF_SW or IF_SD))<>0 then
- begin
- if (insentry^.flags and IF_ARMASK)=0 then
- begin
- if (insentry^.flags and IF_SB)<>0 then
- begin
- if opsize=S_NO then
- opsize:=S_B;
- end
- else if (insentry^.flags and IF_SW)<>0 then
- begin
- if opsize=S_NO then
- opsize:=S_W;
- end
- else if (insentry^.flags and IF_SD)<>0 then
- begin
- if opsize=S_NO then
- opsize:=S_L;
- end;
- end;
- end;
- LastInsOffset:=InsOffset;
- Pass1:=InsSize;
- exit;
- end;
- LastInsOffset:=-1;
- end;
- const
- segprefixes: array[NR_ES..NR_GS] of Byte=(
- // es cs ss ds fs gs
- $26, $2E, $36, $3E, $64, $65
- );
- procedure taicpu.Pass2(objdata:TObjData);
- begin
- { error in pass1 ? }
- if insentry=nil then
- exit;
- current_filepos:=fileinfo;
- { Segment override }
- if (segprefix>=NR_ES) and (segprefix<=NR_GS) then
- begin
- objdata.writebytes(segprefixes[segprefix],1);
- { fix the offset for GenNode }
- inc(InsOffset);
- end
- else if segprefix<>NR_NO then
- InternalError(201001071);
- { Generate the instruction }
- GenCode(objdata);
- end;
- function taicpu.needaddrprefix(opidx:byte):boolean;
- begin
- result:=(oper[opidx]^.typ=top_ref) and
- (oper[opidx]^.ref^.refaddr=addr_no) and
- {$ifdef x86_64}
- (oper[opidx]^.ref^.base<>NR_RIP) and
- {$endif x86_64}
- (
- (
- (oper[opidx]^.ref^.index<>NR_NO) and
- (getsubreg(oper[opidx]^.ref^.index)<>R_SUBADDR)
- ) or
- (
- (oper[opidx]^.ref^.base<>NR_NO) and
- (getsubreg(oper[opidx]^.ref^.base)<>R_SUBADDR)
- )
- );
- end;
- procedure badreg(r:Tregister);
- begin
- Message1(asmw_e_invalid_register,generic_regname(r));
- end;
- function regval(r:Tregister):byte;
- const
- intsupreg2opcode: array[0..7] of byte=
- // ax cx dx bx si di bp sp -- in x86reg.dat
- // ax cx dx bx sp bp si di -- needed order
- (0, 1, 2, 3, 6, 7, 5, 4);
- maxsupreg: array[tregistertype] of tsuperregister=
- {$ifdef x86_64}
- (0, 16, 9, 8, 16, 32, 0);
- {$else x86_64}
- (0, 8, 9, 8, 8, 32, 0);
- {$endif x86_64}
- var
- rs: tsuperregister;
- rt: tregistertype;
- begin
- rs:=getsupreg(r);
- rt:=getregtype(r);
- if (rs>=maxsupreg[rt]) then
- badreg(r);
- result:=rs and 7;
- if (rt=R_INTREGISTER) then
- begin
- if (rs<8) then
- result:=intsupreg2opcode[rs];
- if getsubreg(r)=R_SUBH then
- inc(result,4);
- end;
- end;
- {$ifdef x86_64}
- function rexbits(r: tregister): byte;
- begin
- result:=0;
- case getregtype(r) of
- R_INTREGISTER:
- if (getsupreg(r)>=RS_R8) then
- { Either B,X or R bits can be set, depending on register role in instruction.
- Set all three bits here, caller will discard unnecessary ones. }
- result:=result or $47
- else if (getsubreg(r)=R_SUBL) and
- (getsupreg(r) in [RS_RDI,RS_RSI,RS_RBP,RS_RSP]) then
- result:=result or $40
- else if (getsubreg(r)=R_SUBH) then
- { Not an actual REX bit, used to detect incompatible usage of
- AH/BH/CH/DH }
- result:=result or $80;
- R_MMREGISTER:
- if getsupreg(r)>=RS_XMM8 then
- result:=result or $47;
- end;
- end;
- function process_ea(const input:toper;out output:ea;rfield:longint):boolean;
- var
- sym : tasmsymbol;
- md,s,rv : byte;
- base,index,scalefactor,
- o : longint;
- ir,br : Tregister;
- isub,bsub : tsubregister;
- begin
- process_ea:=false;
- fillchar(output,sizeof(output),0);
- {Register ?}
- if (input.typ=top_reg) then
- begin
- rv:=regval(input.reg);
- output.modrm:=$c0 or (rfield shl 3) or rv;
- output.size:=1;
- output.rex:=output.rex or (rexbits(input.reg) and $F1);
- process_ea:=true;
- exit;
- end;
- {No register, so memory reference.}
- if input.typ<>top_ref then
- internalerror(200409263);
- ir:=input.ref^.index;
- br:=input.ref^.base;
- isub:=getsubreg(ir);
- bsub:=getsubreg(br);
- s:=input.ref^.scalefactor;
- o:=input.ref^.offset;
- sym:=input.ref^.symbol;
- //if ((ir<>NR_NO) and (getregtype(ir)<>R_INTREGISTER)) or
- // ((br<>NR_NO) and (br<>NR_RIP) and (getregtype(br)<>R_INTREGISTER)) then
- if ((ir<>NR_NO) and (getregtype(ir)=R_MMREGISTER) and (br<>NR_NO) and (getregtype(br)<>R_INTREGISTER)) or // vector memory (AVX2)
- ((ir<>NR_NO) and (getregtype(ir)<>R_INTREGISTER) and (getregtype(ir)<>R_MMREGISTER)) or
- ((br<>NR_NO) and (br<>NR_RIP) and (getregtype(br)<>R_INTREGISTER)) then
- internalerror(200301081);
- { it's direct address }
- if (br=NR_NO) and (ir=NR_NO) then
- begin
- output.sib_present:=true;
- output.bytes:=4;
- output.modrm:=4 or (rfield shl 3);
- output.sib:=$25;
- end
- else if (br=NR_RIP) and (ir=NR_NO) then
- begin
- { rip based }
- output.sib_present:=false;
- output.bytes:=4;
- output.modrm:=5 or (rfield shl 3);
- end
- else
- { it's an indirection }
- begin
- { 16 bit? }
- if ((ir<>NR_NO) and (isub in [R_SUBMMX,R_SUBMMY]) and
- (br<>NR_NO) and (bsub=R_SUBADDR)
- ) then
- begin
- // vector memory (AVX2) =>> ignore
- end
- else if ((ir<>NR_NO) and (isub<>R_SUBADDR) and (isub<>R_SUBD)) or
- ((br<>NR_NO) and (bsub<>R_SUBADDR) and (bsub<>R_SUBD)) then
- begin
- message(asmw_e_16bit_32bit_not_supported);
- end;
- { wrong, for various reasons }
- if (ir=NR_ESP) or ((s<>1) and (s<>2) and (s<>4) and (s<>8) and (ir<>NR_NO)) then
- exit;
- output.rex:=output.rex or (rexbits(br) and $F1) or (rexbits(ir) and $F2);
- process_ea:=true;
- { base }
- case br of
- NR_R8D,
- NR_EAX,
- NR_R8,
- NR_RAX : base:=0;
- NR_R9D,
- NR_ECX,
- NR_R9,
- NR_RCX : base:=1;
- NR_R10D,
- NR_EDX,
- NR_R10,
- NR_RDX : base:=2;
- NR_R11D,
- NR_EBX,
- NR_R11,
- NR_RBX : base:=3;
- NR_R12D,
- NR_ESP,
- NR_R12,
- NR_RSP : base:=4;
- NR_R13D,
- NR_EBP,
- NR_R13,
- NR_NO,
- NR_RBP : base:=5;
- NR_R14D,
- NR_ESI,
- NR_R14,
- NR_RSI : base:=6;
- NR_R15D,
- NR_EDI,
- NR_R15,
- NR_RDI : base:=7;
- else
- exit;
- end;
- { index }
- case ir of
- NR_R8D,
- NR_EAX,
- NR_R8,
- NR_RAX,
- NR_XMM0,
- NR_XMM8,
- NR_YMM0,
- NR_YMM8 : index:=0;
- NR_R9D,
- NR_ECX,
- NR_R9,
- NR_RCX,
- NR_XMM1,
- NR_XMM9,
- NR_YMM1,
- NR_YMM9 : index:=1;
- NR_R10D,
- NR_EDX,
- NR_R10,
- NR_RDX,
- NR_XMM2,
- NR_XMM10,
- NR_YMM2,
- NR_YMM10 : index:=2;
- NR_R11D,
- NR_EBX,
- NR_R11,
- NR_RBX,
- NR_XMM3,
- NR_XMM11,
- NR_YMM3,
- NR_YMM11 : index:=3;
- NR_R12D,
- NR_ESP,
- NR_R12,
- NR_NO,
- NR_XMM4,
- NR_XMM12,
- NR_YMM4,
- NR_YMM12 : index:=4;
- NR_R13D,
- NR_EBP,
- NR_R13,
- NR_RBP,
- NR_XMM5,
- NR_XMM13,
- NR_YMM5,
- NR_YMM13: index:=5;
- NR_R14D,
- NR_ESI,
- NR_R14,
- NR_RSI,
- NR_XMM6,
- NR_XMM14,
- NR_YMM6,
- NR_YMM14: index:=6;
- NR_R15D,
- NR_EDI,
- NR_R15,
- NR_RDI,
- NR_XMM7,
- NR_XMM15,
- NR_YMM7,
- NR_YMM15: index:=7;
- else
- exit;
- end;
- case s of
- 0,
- 1 : scalefactor:=0;
- 2 : scalefactor:=1;
- 4 : scalefactor:=2;
- 8 : scalefactor:=3;
- else
- exit;
- end;
- { If rbp or r13 is used we must always include an offset }
- if (br=NR_NO) or
- ((br<>NR_RBP) and (br<>NR_R13) and (br<>NR_EBP) and (br<>NR_R13D) and (o=0) and (sym=nil)) then
- md:=0
- else
- if ((o>=-128) and (o<=127) and (sym=nil)) then
- md:=1
- else
- md:=2;
- if (br=NR_NO) or (md=2) then
- output.bytes:=4
- else
- output.bytes:=md;
- { SIB needed ? }
- if (ir=NR_NO) and (br<>NR_RSP) and (br<>NR_R12) and (br<>NR_ESP) and (br<>NR_R12D) then
- begin
- output.sib_present:=false;
- output.modrm:=(md shl 6) or (rfield shl 3) or base;
- end
- else
- begin
- output.sib_present:=true;
- output.modrm:=(md shl 6) or (rfield shl 3) or 4;
- output.sib:=(scalefactor shl 6) or (index shl 3) or base;
- end;
- end;
- output.size:=1+ord(output.sib_present)+output.bytes;
- process_ea:=true;
- end;
- {$else x86_64}
- function process_ea(const input:toper;out output:ea;rfield:longint):boolean;
- var
- sym : tasmsymbol;
- md,s,rv : byte;
- base,index,scalefactor,
- o : longint;
- ir,br : Tregister;
- isub,bsub : tsubregister;
- begin
- process_ea:=false;
- fillchar(output,sizeof(output),0);
- {Register ?}
- if (input.typ=top_reg) then
- begin
- rv:=regval(input.reg);
- output.modrm:=$c0 or (rfield shl 3) or rv;
- output.size:=1;
- process_ea:=true;
- exit;
- end;
- {No register, so memory reference.}
- if (input.typ<>top_ref) then
- internalerror(200409262);
- if ((input.ref^.index<>NR_NO) and (getregtype(input.ref^.index)=R_MMREGISTER) and (input.ref^.base<>NR_NO) and (getregtype(input.ref^.base)<>R_INTREGISTER)) or // vector memory (AVX2)
- ((input.ref^.index<>NR_NO) and (getregtype(input.ref^.index)<>R_INTREGISTER) and (getregtype(input.ref^.index)<>R_MMREGISTER)) or
- ((input.ref^.base<>NR_NO) and (getregtype(input.ref^.base)<>R_INTREGISTER)) then
- internalerror(200301081);
- ir:=input.ref^.index;
- br:=input.ref^.base;
- isub:=getsubreg(ir);
- bsub:=getsubreg(br);
- s:=input.ref^.scalefactor;
- o:=input.ref^.offset;
- sym:=input.ref^.symbol;
- { it's direct address }
- if (br=NR_NO) and (ir=NR_NO) then
- begin
- { it's a pure offset }
- output.sib_present:=false;
- output.bytes:=4;
- output.modrm:=5 or (rfield shl 3);
- end
- else
- { it's an indirection }
- begin
- { 16 bit address? }
- if ((ir<>NR_NO) and (isub in [R_SUBMMX,R_SUBMMY]) and
- (br<>NR_NO) and (bsub=R_SUBADDR)
- ) then
- begin
- // vector memory (AVX2) =>> ignore
- end
- else if ((ir<>NR_NO) and (isub<>R_SUBADDR)) or
- ((br<>NR_NO) and (bsub<>R_SUBADDR)) then
- message(asmw_e_16bit_not_supported);
- {$ifdef OPTEA}
- { make single reg base }
- if (br=NR_NO) and (s=1) then
- begin
- br:=ir;
- ir:=NR_NO;
- end;
- { convert [3,5,9]*EAX to EAX+[2,4,8]*EAX }
- if (br=NR_NO) and
- (((s=2) and (ir<>NR_ESP)) or
- (s=3) or (s=5) or (s=9)) then
- begin
- br:=ir;
- dec(s);
- end;
- { swap ESP into base if scalefactor is 1 }
- if (s=1) and (ir=NR_ESP) then
- begin
- ir:=br;
- br:=NR_ESP;
- end;
- {$endif OPTEA}
- { wrong, for various reasons }
- if (ir=NR_ESP) or ((s<>1) and (s<>2) and (s<>4) and (s<>8) and (ir<>NR_NO)) then
- exit;
- { base }
- case br of
- NR_EAX : base:=0;
- NR_ECX : base:=1;
- NR_EDX : base:=2;
- NR_EBX : base:=3;
- NR_ESP : base:=4;
- NR_NO,
- NR_EBP : base:=5;
- NR_ESI : base:=6;
- NR_EDI : base:=7;
- else
- exit;
- end;
- { index }
- case ir of
- NR_EAX,
- NR_XMM0,
- NR_YMM0: index:=0;
- NR_ECX,
- NR_XMM1,
- NR_YMM1: index:=1;
- NR_EDX,
- NR_XMM2,
- NR_YMM2: index:=2;
- NR_EBX,
- NR_XMM3,
- NR_YMM3: index:=3;
- NR_NO,
- NR_XMM4,
- NR_YMM4: index:=4;
- NR_EBP,
- NR_XMM5,
- NR_YMM5: index:=5;
- NR_ESI,
- NR_XMM6,
- NR_YMM6: index:=6;
- NR_EDI,
- NR_XMM7,
- NR_YMM7: index:=7;
- else
- exit;
- end;
- case s of
- 0,
- 1 : scalefactor:=0;
- 2 : scalefactor:=1;
- 4 : scalefactor:=2;
- 8 : scalefactor:=3;
- else
- exit;
- end;
- if (br=NR_NO) or
- ((br<>NR_EBP) and (o=0) and (sym=nil)) then
- md:=0
- else
- if ((o>=-128) and (o<=127) and (sym=nil)) then
- md:=1
- else
- md:=2;
- if (br=NR_NO) or (md=2) then
- output.bytes:=4
- else
- output.bytes:=md;
- { SIB needed ? }
- if (ir=NR_NO) and (br<>NR_ESP) then
- begin
- output.sib_present:=false;
- output.modrm:=(longint(md) shl 6) or (rfield shl 3) or base;
- end
- else
- begin
- output.sib_present:=true;
- output.modrm:=(longint(md) shl 6) or (rfield shl 3) or 4;
- output.sib:=(scalefactor shl 6) or (index shl 3) or base;
- end;
- end;
- if output.sib_present then
- output.size:=2+output.bytes
- else
- output.size:=1+output.bytes;
- process_ea:=true;
- end;
- {$endif x86_64}
- function taicpu.calcsize(p:PInsEntry):shortint;
- var
- codes : pchar;
- c : byte;
- len : shortint;
- ea_data : ea;
- exists_vex: boolean;
- exists_vex_extension: boolean;
- exists_prefix_66: boolean;
- exists_prefix_F2: boolean;
- exists_prefix_F3: boolean;
- {$ifdef x86_64}
- omit_rexw : boolean;
- {$endif x86_64}
- begin
- len:=0;
- codes:=@p^.code[0];
- exists_vex := false;
- exists_vex_extension := false;
- exists_prefix_66 := false;
- exists_prefix_F2 := false;
- exists_prefix_F3 := false;
- {$ifdef x86_64}
- rex:=0;
- omit_rexw:=false;
- {$endif x86_64}
- repeat
- c:=ord(codes^);
- inc(codes);
- case c of
- 0 :
- break;
- 1,2,3 :
- begin
- inc(codes,c);
- inc(len,c);
- end;
- 8,9,10 :
- begin
- {$ifdef x86_64}
- rex:=rex or (rexbits(oper[c-8]^.reg) and $F1);
- {$endif x86_64}
- inc(codes);
- inc(len);
- end;
- 11 :
- begin
- inc(codes);
- inc(len);
- end;
- 4,5,6,7 :
- begin
- if opsize=S_W then
- inc(len,2)
- else
- inc(len);
- end;
- 12,13,14,
- 16,17,18,
- 20,21,22,23,
- 40,41,42 :
- inc(len);
- 24,25,26,
- 31,
- 48,49,50 :
- inc(len,2);
- 28,29,30:
- begin
- if opsize=S_Q then
- inc(len,8)
- else
- inc(len,4);
- end;
- 36,37,38:
- inc(len,sizeof(pint));
- 44,45,46:
- inc(len,8);
- 32,33,34,
- 52,53,54,
- 56,57,58,
- 172,173,174 :
- inc(len,4);
- 60,61,62,63: ; // ignore vex-coded operand-idx
- 208,209,210 :
- begin
- case (oper[c-208]^.ot and OT_SIZE_MASK) of
- OT_BITS16:
- inc(len);
- {$ifdef x86_64}
- OT_BITS64:
- begin
- rex:=rex or $48;
- end;
- {$endif x86_64}
- end;
- end;
- 200 :
- {$ifndef x86_64}
- inc(len);
- {$else x86_64}
- { every insentry with code 0310 must be marked with NOX86_64 }
- InternalError(2011051301);
- {$endif x86_64}
- 201 :
- {$ifdef x86_64}
- inc(len)
- {$endif x86_64}
- ;
- 212 :
- inc(len);
- 214 :
- begin
- {$ifdef x86_64}
- rex:=rex or $48;
- {$endif x86_64}
- end;
- 202,
- 211,
- 213,
- 215,
- 217,218: ;
- 219:
- begin
- inc(len);
- exists_prefix_F2 := true;
- end;
- 220:
- begin
- inc(len);
- exists_prefix_F3 := true;
- end;
- 241:
- begin
- inc(len);
- exists_prefix_66 := true;
- end;
- 221:
- {$ifdef x86_64}
- omit_rexw:=true
- {$endif x86_64}
- ;
- 64..151 :
- begin
- {$ifdef x86_64}
- if (c<127) then
- begin
- if (oper[c and 7]^.typ=top_reg) then
- begin
- rex:=rex or (rexbits(oper[c and 7]^.reg) and $F4);
- end;
- end;
- {$endif x86_64}
- if not process_ea(oper[(c shr 3) and 7]^, ea_data, 0) then
- Message(asmw_e_invalid_effective_address)
- else
- inc(len,ea_data.size);
- {$ifdef x86_64}
- rex:=rex or ea_data.rex;
- {$endif x86_64}
- end;
- 242: // VEX prefix for AVX (length = 2 or 3 bytes, dependens on REX.XBW or opcode-prefix ($0F38 or $0F3A))
- // =>> DEFAULT = 2 Bytes
- begin
- if not(exists_vex) then
- begin
- inc(len, 2);
- exists_vex := true;
- end;
- end;
- 243: // REX.W = 1
- // =>> VEX prefix length = 3
- begin
- if not(exists_vex_extension) then
- begin
- inc(len);
- exists_vex_extension := true;
- end;
- end;
- 244: ; // VEX length bit
- 246, // operand 2 (ymmreg) encoded immediate byte (bit 4-7)
- 247: inc(len); // operand 3 (ymmreg) encoded immediate byte (bit 4-7)
- 248: // VEX-Extension prefix $0F
- // ignore for calculating length
- ;
- 249, // VEX-Extension prefix $0F38
- 250: // VEX-Extension prefix $0F3A
- begin
- if not(exists_vex_extension) then
- begin
- inc(len);
- exists_vex_extension := true;
- end;
- end;
- 192,193,194:
- begin
- {$ifdef x86_64}
- if (oper[c and 3]^.ot and OT_SIZE_MASK)=OT_BITS32 then
- inc(len);
- {$endif x86_64}
- end;
- else
- InternalError(200603141);
- end;
- until false;
- {$ifdef x86_64}
- if ((rex and $80)<>0) and ((rex and $4F)<>0) then
- Message(asmw_e_bad_reg_with_rex);
- rex:=rex and $4F; { reset extra bits in upper nibble }
- if omit_rexw then
- begin
- if rex=$48 then { remove rex entirely? }
- rex:=0
- else
- rex:=rex and $F7;
- end;
- if not(exists_vex) then
- begin
- if rex<>0 then
- Inc(len);
- end;
- {$endif}
- if exists_vex then
- begin
- if exists_prefix_66 then dec(len);
- if exists_prefix_F2 then dec(len);
- if exists_prefix_F3 then dec(len);
- {$ifdef x86_64}
- if not(exists_vex_extension) then
- if rex and $0B <> 0 then inc(len); // REX.WXB <> 0 =>> needed VEX-Extension
- {$endif x86_64}
- end;
- calcsize:=len;
- end;
- procedure taicpu.GenCode(objdata:TObjData);
- {
- * the actual codes (C syntax, i.e. octal):
- * \0 - terminates the code. (Unless it's a literal of course.)
- * \1, \2, \3 - that many literal bytes follow in the code stream
- * \4, \6 - the POP/PUSH (respectively) codes for CS, DS, ES, SS
- * (POP is never used for CS) depending on operand 0
- * \5, \7 - the second byte of POP/PUSH codes for FS, GS, depending
- * on operand 0
- * \10, \11, \12 - a literal byte follows in the code stream, to be added
- * to the register value of operand 0, 1 or 2
- * \13 - a literal byte follows in the code stream, to be added
- * to the condition code value of the instruction.
- * \14, \15, \16 - a signed byte immediate operand, from operand 0, 1 or 2
- * \20, \21, \22 - a byte immediate operand, from operand 0, 1 or 2
- * \24, \25, \26, \27 - an unsigned byte immediate operand, from operand 0, 1, 2 or 3
- * \30, \31, \32 - a word immediate operand, from operand 0, 1 or 2
- * \34, \35, \36 - select between \3[012] and \4[012] depending on 16/32 bit
- * assembly mode or the address-size override on the operand
- * \37 - a word constant, from the _segment_ part of operand 0
- * \40, \41, \42 - a long immediate operand, from operand 0, 1 or 2
- * \44, \45, \46 - select between \3[012], \4[012] or \5[456] depending
- on the address size of instruction
- * \50, \51, \52 - a byte relative operand, from operand 0, 1 or 2
- * \54, \55, \56 - a qword immediate, from operand 0, 1 or 2
- * \60, \61, \62 - a word relative operand, from operand 0, 1 or 2
- * \64, \65, \66 - select between \6[012] and \7[012] depending on 16/32 bit
- * assembly mode or the address-size override on the operand
- * \70, \71, \72 - a long relative operand, from operand 0, 1 or 2
- * \74, \75, \76 - a vex-coded vector operand, from operand 0, 1 or 2
- * \1ab - a ModRM, calculated on EA in operand a, with the spare
- * field the register value of operand b.
- * \2ab - a ModRM, calculated on EA in operand a, with the spare
- * field equal to digit b.
- * \254,\255,\256 - a signed 32-bit immediate to be extended to 64 bits
- * \300,\301,\302 - might be an 0x67, depending on the address size of
- * the memory reference in operand x.
- * \310 - indicates fixed 16-bit address size, i.e. optional 0x67.
- * \311 - indicates fixed 32-bit address size, i.e. optional 0x67.
- * \312 - (disassembler only) invalid with non-default address size.
- * \320,\321,\322 - might be an 0x66 or 0x48 byte, depending on the operand
- * size of operand x.
- * \324 - indicates fixed 16-bit operand size, i.e. optional 0x66.
- * \325 - indicates fixed 32-bit operand size, i.e. optional 0x66.
- * \326 - indicates fixed 64-bit operand size, i.e. optional 0x48.
- * \327 - indicates that this instruction is only valid when the
- * operand size is the default (instruction to disassembler,
- * generates no code in the assembler)
- * \331 - instruction not valid with REP prefix. Hint for
- * disassembler only; for SSE instructions.
- * \332 - disassemble a rep (0xF3 byte) prefix as repe not rep.
- * \333 - 0xF3 prefix for SSE instructions
- * \334 - 0xF2 prefix for SSE instructions
- * \335 - Indicates 64-bit operand size with REX.W not necessary
- * \361 - 0x66 prefix for SSE instructions
- * \362 - VEX prefix for AVX instructions
- * \363 - VEX W1
- * \364 - VEX Vector length 256
- * \366 - operand 2 (ymmreg) encoded in bit 4-7 of the immediate byte
- * \367 - operand 3 (ymmreg) encoded in bit 4-7 of the immediate byte
- * \370 - VEX 0F-FLAG
- * \371 - VEX 0F38-FLAG
- * \372 - VEX 0F3A-FLAG
- }
- var
- currval : aint;
- currsym : tobjsymbol;
- currrelreloc,
- currabsreloc,
- currabsreloc32 : TObjRelocationType;
- {$ifdef x86_64}
- rexwritten : boolean;
- {$endif x86_64}
- procedure getvalsym(opidx:longint);
- begin
- case oper[opidx]^.typ of
- top_ref :
- begin
- currval:=oper[opidx]^.ref^.offset;
- currsym:=ObjData.symbolref(oper[opidx]^.ref^.symbol);
- {$ifdef i386}
- if (oper[opidx]^.ref^.refaddr=addr_pic) and
- (tf_pic_uses_got in target_info.flags) then
- begin
- currrelreloc:=RELOC_PLT32;
- currabsreloc:=RELOC_GOT32;
- currabsreloc32:=RELOC_GOT32;
- end
- else
- {$endif i386}
- {$ifdef x86_64}
- if oper[opidx]^.ref^.refaddr=addr_pic then
- begin
- currrelreloc:=RELOC_PLT32;
- currabsreloc:=RELOC_GOTPCREL;
- currabsreloc32:=RELOC_GOTPCREL;
- end
- else if oper[opidx]^.ref^.refaddr=addr_pic_no_got then
- begin
- currrelreloc:=RELOC_RELATIVE;
- currabsreloc:=RELOC_RELATIVE;
- currabsreloc32:=RELOC_RELATIVE;
- end
- else
- {$endif x86_64}
- begin
- currrelreloc:=RELOC_RELATIVE;
- currabsreloc:=RELOC_ABSOLUTE;
- currabsreloc32:=RELOC_ABSOLUTE32;
- end;
- end;
- top_const :
- begin
- currval:=aint(oper[opidx]^.val);
- currsym:=nil;
- currabsreloc:=RELOC_ABSOLUTE;
- currabsreloc32:=RELOC_ABSOLUTE32;
- end;
- else
- Message(asmw_e_immediate_or_reference_expected);
- end;
- end;
- {$ifdef x86_64}
- procedure maybewriterex;
- begin
- if (rex<>0) and not(rexwritten) then
- begin
- rexwritten:=true;
- objdata.writebytes(rex,1);
- end;
- end;
- {$endif x86_64}
- procedure objdata_writereloc(Data:aint;len:aword;p:TObjSymbol;Reloctype:TObjRelocationType);
- begin
- {$ifdef i386}
- { Special case of '_GLOBAL_OFFSET_TABLE_'
- which needs a special relocation type R_386_GOTPC }
- if assigned (p) and
- (p.name='_GLOBAL_OFFSET_TABLE_') and
- (tf_pic_uses_got in target_info.flags) then
- begin
- { nothing else than a 4 byte relocation should occur
- for GOT }
- if len<>4 then
- Message1(asmw_e_invalid_opcode_and_operands,GetString);
- Reloctype:=RELOC_GOTPC;
- { We need to add the offset of the relocation
- of _GLOBAL_OFFSET_TABLE symbol within
- the current instruction }
- inc(data,objdata.currobjsec.size-insoffset);
- end;
- {$endif i386}
- objdata.writereloc(data,len,p,Reloctype);
- end;
- const
- CondVal:array[TAsmCond] of byte=($0,
- $7, $3, $2, $6, $2, $4, $F, $D, $C, $E, $6, $2,
- $3, $7, $3, $5, $E, $C, $D, $F, $1, $B, $9, $5,
- $0, $A, $A, $B, $8, $4);
- var
- c : byte;
- pb : pbyte;
- codes : pchar;
- bytes : array[0..3] of byte;
- rfield,
- data,s,opidx : longint;
- ea_data : ea;
- relsym : TObjSymbol;
- needed_VEX_Extension: boolean;
- needed_VEX: boolean;
- opmode: integer;
- VEXvvvv: byte;
- VEXmmmmm: byte;
- begin
- { safety check }
- if objdata.currobjsec.size<>longword(insoffset) then
- internalerror(200130121);
- { those variables are initialized inside local procedures, the dfa cannot handle this yet }
- currsym:=nil;
- currabsreloc:=RELOC_NONE;
- currabsreloc32:=RELOC_NONE;
- currrelreloc:=RELOC_NONE;
- currval:=0;
- { load data to write }
- codes:=insentry^.code;
- {$ifdef x86_64}
- rexwritten:=false;
- {$endif x86_64}
- { Force word push/pop for registers }
- if (opsize=S_W) and ((codes[0]=#4) or (codes[0]=#6) or
- ((codes[0]=#1) and ((codes[2]=#5) or (codes[2]=#7)))) then
- begin
- bytes[0]:=$66;
- objdata.writebytes(bytes,1);
- end;
- // needed VEX Prefix (for AVX etc.)
- needed_VEX := false;
- needed_VEX_Extension := false;
- opmode := -1;
- VEXvvvv := 0;
- VEXmmmmm := 0;
- repeat
- c:=ord(codes^);
- inc(codes);
- case c of
- 0: break;
- 1,
- 2,
- 3: inc(codes,c);
- 60: opmode := 0;
- 61: opmode := 1;
- 62: opmode := 2;
- 219: VEXvvvv := VEXvvvv OR $02; // set SIMD-prefix $F3
- 220: VEXvvvv := VEXvvvv OR $03; // set SIMD-prefix $F2
- 241: VEXvvvv := VEXvvvv OR $01; // set SIMD-prefix $66
- 242: needed_VEX := true;
- 243: begin
- needed_VEX_Extension := true;
- VEXvvvv := VEXvvvv OR (1 shl 7); // set REX.W
- end;
- 244: VEXvvvv := VEXvvvv OR $04; // vectorlength = 256 bits AND no scalar
- 248: VEXmmmmm := VEXmmmmm OR $01; // set leading opcode byte $0F
- 249: begin
- needed_VEX_Extension := true;
- VEXmmmmm := VEXmmmmm OR $02; // set leading opcode byte $0F38
- end;
- 250: begin
- needed_VEX_Extension := true;
- VEXmmmmm := VEXmmmmm OR $03; // set leading opcode byte $0F3A
- end;
- end;
- until false;
- if needed_VEX then
- begin
- if (opmode > ops) or
- (opmode < -1) then
- begin
- Internalerror(777100);
- end
- else if opmode = -1 then
- begin
- VEXvvvv := VEXvvvv or ($0F shl 3); // set VEXvvvv bits (bits 6-3) to 1
- end
- else if oper[opmode]^.typ = top_reg then
- begin
- VEXvvvv := VEXvvvv or ((not(regval(oper[opmode]^.reg)) and $07) shl 3);
- {$ifdef x86_64}
- if rexbits(oper[opmode]^.reg) = 0 then VEXvvvv := VEXvvvv or (1 shl 6);
- {$else}
- VEXvvvv := VEXvvvv or (1 shl 6);
- {$endif x86_64}
- end
- else Internalerror(777101);
- if not(needed_VEX_Extension) then
- begin
- {$ifdef x86_64}
- if rex and $0B <> 0 then needed_VEX_Extension := true;
- {$endif x86_64}
- end;
- if needed_VEX_Extension then
- begin
- // VEX-Prefix-Length = 3 Bytes
- bytes[0]:=$C4;
- objdata.writebytes(bytes,1);
- {$ifdef x86_64}
- VEXmmmmm := VEXmmmmm or ((not(rex) and $07) shl 5); // set REX.rxb
- {$else}
- VEXmmmmm := VEXmmmmm or (7 shl 5); //
- {$endif x86_64}
- bytes[0] := VEXmmmmm;
- objdata.writebytes(bytes,1);
- {$ifdef x86_64}
- VEXvvvv := VEXvvvv OR ((rex and $08) shl 7); // set REX.w
- {$endif x86_64}
- bytes[0] := VEXvvvv;
- objdata.writebytes(bytes,1);
- end
- else
- begin
- // VEX-Prefix-Length = 2 Bytes
- bytes[0]:=$C5;
- objdata.writebytes(bytes,1);
- {$ifdef x86_64}
- if rex and $04 = 0 then
- {$endif x86_64}
- begin
- VEXvvvv := VEXvvvv or (1 shl 7);
- end;
- bytes[0] := VEXvvvv;
- objdata.writebytes(bytes,1);
- end;
- end
- else
- begin
- needed_VEX_Extension := false;
- opmode := -1;
- end;
- { load data to write }
- codes:=insentry^.code;
- repeat
- c:=ord(codes^);
- inc(codes);
- case c of
- 0 :
- break;
- 1,2,3 :
- begin
- {$ifdef x86_64}
- if not(needed_VEX) then // TG
- maybewriterex;
- {$endif x86_64}
- objdata.writebytes(codes^,c);
- inc(codes,c);
- end;
- 4,6 :
- begin
- case oper[0]^.reg of
- NR_CS:
- bytes[0]:=$e;
- NR_NO,
- NR_DS:
- bytes[0]:=$1e;
- NR_ES:
- bytes[0]:=$6;
- NR_SS:
- bytes[0]:=$16;
- else
- internalerror(777004);
- end;
- if c=4 then
- inc(bytes[0]);
- objdata.writebytes(bytes,1);
- end;
- 5,7 :
- begin
- case oper[0]^.reg of
- NR_FS:
- bytes[0]:=$a0;
- NR_GS:
- bytes[0]:=$a8;
- else
- internalerror(777005);
- end;
- if c=5 then
- inc(bytes[0]);
- objdata.writebytes(bytes,1);
- end;
- 8,9,10 :
- begin
- {$ifdef x86_64}
- if not(needed_VEX) then // TG
- maybewriterex;
- {$endif x86_64}
- bytes[0]:=ord(codes^)+regval(oper[c-8]^.reg);
- inc(codes);
- objdata.writebytes(bytes,1);
- end;
- 11 :
- begin
- bytes[0]:=ord(codes^)+condval[condition];
- inc(codes);
- objdata.writebytes(bytes,1);
- end;
- 12,13,14 :
- begin
- getvalsym(c-12);
- if (currval<-128) or (currval>127) then
- Message2(asmw_e_value_exceeds_bounds,'signed byte',tostr(currval));
- if assigned(currsym) then
- objdata_writereloc(currval,1,currsym,currabsreloc)
- else
- objdata.writebytes(currval,1);
- end;
- 16,17,18 :
- begin
- getvalsym(c-16);
- if (currval<-256) or (currval>255) then
- Message2(asmw_e_value_exceeds_bounds,'byte',tostr(currval));
- if assigned(currsym) then
- objdata_writereloc(currval,1,currsym,currabsreloc)
- else
- objdata.writebytes(currval,1);
- end;
- 20,21,22,23 :
- begin
- getvalsym(c-20);
- if (currval<0) or (currval>255) then
- Message2(asmw_e_value_exceeds_bounds,'unsigned byte',tostr(currval));
- if assigned(currsym) then
- objdata_writereloc(currval,1,currsym,currabsreloc)
- else
- objdata.writebytes(currval,1);
- end;
- 24,25,26 : // 030..032
- begin
- getvalsym(c-24);
- {$ifndef i8086}
- { currval is an aint so this cannot happen on i8086 and causes only a warning }
- if (currval<-65536) or (currval>65535) then
- Message2(asmw_e_value_exceeds_bounds,'word',tostr(currval));
- {$endif i8086}
- if assigned(currsym) then
- objdata_writereloc(currval,2,currsym,currabsreloc)
- else
- objdata.writebytes(currval,2);
- end;
- 28,29,30 : // 034..036
- { !!! These are intended (and used in opcode table) to select depending
- on address size, *not* operand size. Works by coincidence only. }
- begin
- getvalsym(c-28);
- if opsize=S_Q then
- begin
- if assigned(currsym) then
- objdata_writereloc(currval,8,currsym,currabsreloc)
- else
- objdata.writebytes(currval,8);
- end
- else
- begin
- if assigned(currsym) then
- objdata_writereloc(currval,4,currsym,currabsreloc32)
- else
- objdata.writebytes(currval,4);
- end
- end;
- 32,33,34 : // 040..042
- begin
- getvalsym(c-32);
- if assigned(currsym) then
- objdata_writereloc(currval,4,currsym,currabsreloc32)
- else
- objdata.writebytes(currval,4);
- end;
- 36,37,38 : // 044..046 - select between word/dword/qword depending on
- begin // address size (we support only default address sizes).
- getvalsym(c-36);
- {$ifdef x86_64}
- if assigned(currsym) then
- objdata_writereloc(currval,8,currsym,currabsreloc)
- else
- objdata.writebytes(currval,8);
- {$else x86_64}
- if assigned(currsym) then
- objdata_writereloc(currval,4,currsym,currabsreloc32)
- else
- objdata.writebytes(currval,4);
- {$endif x86_64}
- end;
- 40,41,42 : // 050..052 - byte relative operand
- begin
- getvalsym(c-40);
- data:=currval-insend;
- {$push}
- {$r-,q-} { disable also overflow as address returns a qword for x86_64 }
- if assigned(currsym) then
- inc(data,currsym.address);
- {$pop}
- if (data>127) or (data<-128) then
- Message1(asmw_e_short_jmp_out_of_range,tostr(data));
- objdata.writebytes(data,1);
- end;
- 44,45,46: // 054..056 - qword immediate operand
- begin
- getvalsym(c-44);
- if assigned(currsym) then
- objdata_writereloc(currval,8,currsym,currabsreloc)
- else
- objdata.writebytes(currval,8);
- end;
- 52,53,54 : // 064..066 - select between 16/32 address mode, but we support only 32
- begin
- getvalsym(c-52);
- if assigned(currsym) then
- objdata_writereloc(currval,4,currsym,currrelreloc)
- else
- objdata_writereloc(currval-insend,4,nil,currabsreloc32)
- end;
- 56,57,58 : // 070..072 - long relative operand
- begin
- getvalsym(c-56);
- if assigned(currsym) then
- objdata_writereloc(currval,4,currsym,currrelreloc)
- else
- objdata_writereloc(currval-insend,4,nil,currabsreloc32)
- end;
- 60,61,62 : ; // 074..076 - vex-coded vector operand
- // ignore
- 172,173,174 : // 0254..0256 - dword implicitly sign-extended to 64-bit (x86_64 only)
- begin
- getvalsym(c-172);
- {$ifdef x86_64}
- { for i386 as aint type is longint the
- following test is useless }
- if (currval<low(longint)) or (currval>high(longint)) then
- Message2(asmw_e_value_exceeds_bounds,'signed dword',tostr(currval));
- {$endif x86_64}
- if assigned(currsym) then
- objdata_writereloc(currval,4,currsym,currabsreloc32)
- else
- objdata.writebytes(currval,4);
- end;
- 192,193,194:
- begin
- {$ifdef x86_64}
- if (oper[c and 3]^.ot and OT_SIZE_MASK)=OT_BITS32 then
- begin
- bytes[0]:=$67;
- objdata.writebytes(bytes,1);
- end;
- {$endif x86_64}
- end;
- 200 : { fixed 16-bit addr }
- {$ifndef x86_64}
- begin
- bytes[0]:=$67;
- objdata.writebytes(bytes,1);
- end;
- {$else x86_64}
- { every insentry having code 0310 must be marked with NOX86_64 }
- InternalError(2011051302);
- {$endif}
- 201 : { fixed 32-bit addr }
- {$ifdef x86_64}
- begin
- bytes[0]:=$67;
- objdata.writebytes(bytes,1);
- end
- {$endif x86_64}
- ;
- 208,209,210 :
- begin
- case oper[c-208]^.ot and OT_SIZE_MASK of
- OT_BITS16 :
- begin
- bytes[0]:=$66;
- objdata.writebytes(bytes,1);
- end;
- {$ifndef x86_64}
- OT_BITS64 :
- Message(asmw_e_64bit_not_supported);
- {$endif x86_64}
- end;
- end;
- 211,
- 213 : {no action needed};
- 212,
- 241:
- begin
- if not(needed_VEX) then
- begin
- bytes[0]:=$66;
- objdata.writebytes(bytes,1);
- end;
- end;
- 214 :
- begin
- {$ifndef x86_64}
- Message(asmw_e_64bit_not_supported);
- {$endif x86_64}
- end;
- 219 :
- begin
- if not(needed_VEX) then
- begin
- bytes[0]:=$f3;
- objdata.writebytes(bytes,1);
- end;
- end;
- 220 :
- begin
- if not(needed_VEX) then
- begin
- bytes[0]:=$f2;
- objdata.writebytes(bytes,1);
- end;
- end;
- 221:
- ;
- 202,
- 215,
- 217,218 :
- begin
- { these are dissambler hints or 32 bit prefixes which
- are not needed }
- end;
- 242..244: ; // VEX flags =>> nothing todo
- 246: begin
- if needed_VEX then
- begin
- if ops = 4 then
- begin
- if (oper[2]^.typ=top_reg) then
- begin
- if (oper[2]^.ot and otf_reg_xmm <> 0) or
- (oper[2]^.ot and otf_reg_ymm <> 0) then
- begin
- bytes[0] := ((getsupreg(oper[2]^.reg) and 15) shl 4);
- objdata.writebytes(bytes,1);
- end
- else Internalerror(2014032001);
- end
- else Internalerror(2014032002);
- end
- else Internalerror(2014032003);
- end
- else Internalerror(2014032004);
- end;
- 247: begin
- if needed_VEX then
- begin
- if ops = 4 then
- begin
- if (oper[3]^.typ=top_reg) then
- begin
- if (oper[3]^.ot and otf_reg_xmm <> 0) or
- (oper[3]^.ot and otf_reg_ymm <> 0) then
- begin
- bytes[0] := ((getsupreg(oper[3]^.reg) and 15) shl 4);
- objdata.writebytes(bytes,1);
- end
- else Internalerror(2014032005);
- end
- else Internalerror(2014032006);
- end
- else Internalerror(2014032007);
- end
- else Internalerror(2014032008);
- end;
- 248..250: ; // VEX flags =>> nothing todo
- 31,
- 48,49,50 :
- begin
- InternalError(777006);
- end
- else
- begin
- { rex should be written at this point }
- {$ifdef x86_64}
- if not(needed_VEX) then // TG
- if (rex<>0) and not(rexwritten) then
- internalerror(200603191);
- {$endif x86_64}
- if (c>=64) and (c<=151) then // 0100..0227
- begin
- if (c<127) then // 0177
- begin
- if (oper[c and 7]^.typ=top_reg) then
- rfield:=regval(oper[c and 7]^.reg)
- else
- rfield:=regval(oper[c and 7]^.ref^.base);
- end
- else
- rfield:=c and 7;
- opidx:=(c shr 3) and 7;
- if not process_ea(oper[opidx]^,ea_data,rfield) then
- Message(asmw_e_invalid_effective_address);
- pb:=@bytes[0];
- pb^:=ea_data.modrm;
- inc(pb);
- if ea_data.sib_present then
- begin
- pb^:=ea_data.sib;
- inc(pb);
- end;
- s:=pb-@bytes[0];
- objdata.writebytes(bytes,s);
- case ea_data.bytes of
- 0 : ;
- 1 :
- begin
- if (oper[opidx]^.ot and OT_MEMORY)=OT_MEMORY then
- begin
- currsym:=objdata.symbolref(oper[opidx]^.ref^.symbol);
- {$ifdef i386}
- if (oper[opidx]^.ref^.refaddr=addr_pic) and
- (tf_pic_uses_got in target_info.flags) then
- currabsreloc:=RELOC_GOT32
- else
- {$endif i386}
- {$ifdef x86_64}
- if oper[opidx]^.ref^.refaddr=addr_pic then
- currabsreloc:=RELOC_GOTPCREL
- else
- {$endif x86_64}
- currabsreloc:=RELOC_ABSOLUTE;
- objdata_writereloc(oper[opidx]^.ref^.offset,1,currsym,currabsreloc);
- end
- else
- begin
- bytes[0]:=oper[opidx]^.ref^.offset;
- objdata.writebytes(bytes,1);
- end;
- inc(s);
- end;
- 2,4 :
- begin
- currsym:=objdata.symbolref(oper[opidx]^.ref^.symbol);
- currval:=oper[opidx]^.ref^.offset;
- {$ifdef x86_64}
- if oper[opidx]^.ref^.refaddr=addr_pic then
- currabsreloc:=RELOC_GOTPCREL
- else
- if oper[opidx]^.ref^.base=NR_RIP then
- begin
- currabsreloc:=RELOC_RELATIVE;
- { Adjust reloc value by number of bytes following the displacement,
- but not if displacement is specified by literal constant }
- if Assigned(currsym) then
- Dec(currval,InsEnd-objdata.CurrObjSec.Size-ea_data.bytes);
- end
- else
- {$endif x86_64}
- {$ifdef i386}
- if (oper[opidx]^.ref^.refaddr=addr_pic) and
- (tf_pic_uses_got in target_info.flags) then
- currabsreloc:=RELOC_GOT32
- else
- {$endif i386}
- currabsreloc:=RELOC_ABSOLUTE32;
- if (currabsreloc=RELOC_ABSOLUTE32) and
- (Assigned(oper[opidx]^.ref^.relsymbol)) then
- begin
- relsym:=objdata.symbolref(oper[opidx]^.ref^.relsymbol);
- if relsym.objsection=objdata.CurrObjSec then
- begin
- currval:=objdata.CurrObjSec.size+ea_data.bytes-relsym.offset+currval;
- currabsreloc:=RELOC_RELATIVE;
- end
- else
- begin
- currabsreloc:=RELOC_PIC_PAIR;
- currval:=relsym.offset;
- end;
- end;
- objdata_writereloc(currval,ea_data.bytes,currsym,currabsreloc);
- inc(s,ea_data.bytes);
- end;
- end;
- end
- else
- InternalError(777007);
- end;
- end;
- until false;
- end;
- function taicpu.is_same_reg_move(regtype: Tregistertype):boolean;
- begin
- result:=(((opcode=A_MOV) or (opcode=A_XCHG)) and
- (regtype = R_INTREGISTER) and
- (ops=2) and
- (oper[0]^.typ=top_reg) and
- (oper[1]^.typ=top_reg) and
- (oper[0]^.reg=oper[1]^.reg)
- ) or
- (((opcode=A_MOVSS) or (opcode=A_MOVSD) or (opcode=A_MOVQ) or
- (opcode=A_MOVAPS) or (OPCODE=A_MOVAPD) or
- (opcode=A_VMOVSS) or (opcode=A_VMOVSD) or (opcode=A_VMOVQ) or
- (opcode=A_VMOVAPS) or (OPCODE=A_VMOVAPD)) and
- (regtype = R_MMREGISTER) and
- (ops=2) and
- (oper[0]^.typ=top_reg) and
- (oper[1]^.typ=top_reg) and
- (oper[0]^.reg=oper[1]^.reg)
- );
- end;
- procedure build_spilling_operation_type_table;
- var
- opcode : tasmop;
- i : integer;
- begin
- new(operation_type_table);
- fillchar(operation_type_table^,sizeof(toperation_type_table),byte(operand_read));
- for opcode:=low(tasmop) to high(tasmop) do
- begin
- for i:=1 to MaxInsChanges do
- begin
- case InsProp[opcode].Ch[i] of
- Ch_Rop1 :
- operation_type_table^[opcode,0]:=operand_read;
- Ch_Wop1 :
- operation_type_table^[opcode,0]:=operand_write;
- Ch_RWop1,
- Ch_Mop1 :
- operation_type_table^[opcode,0]:=operand_readwrite;
- Ch_Rop2 :
- operation_type_table^[opcode,1]:=operand_read;
- Ch_Wop2 :
- operation_type_table^[opcode,1]:=operand_write;
- Ch_RWop2,
- Ch_Mop2 :
- operation_type_table^[opcode,1]:=operand_readwrite;
- Ch_Rop3 :
- operation_type_table^[opcode,2]:=operand_read;
- Ch_Wop3 :
- operation_type_table^[opcode,2]:=operand_write;
- Ch_RWop3,
- Ch_Mop3 :
- operation_type_table^[opcode,2]:=operand_readwrite;
- end;
- end;
- end;
- end;
- function taicpu.spilling_get_operation_type(opnr: longint): topertype;
- begin
- { the information in the instruction table is made for the string copy
- operation MOVSD so hack here (FK)
- VMOVSS and VMOVSD has two and three operand flavours, this cannot modelled by x86ins.dat
- so fix it here (FK)
- }
- if ((opcode=A_MOVSD) or (opcode=A_VMOVSS) or (opcode=A_VMOVSD)) and (ops=2) then
- begin
- case opnr of
- 0:
- result:=operand_read;
- 1:
- result:=operand_write;
- else
- internalerror(200506055);
- end
- end
- { IMUL has 1, 2 and 3-operand forms }
- else if opcode=A_IMUL then
- begin
- case ops of
- 1:
- if opnr=0 then
- result:=operand_read
- else
- internalerror(2014011802);
- 2:
- begin
- case opnr of
- 0:
- result:=operand_read;
- 1:
- result:=operand_readwrite;
- else
- internalerror(2014011803);
- end;
- end;
- 3:
- begin
- case opnr of
- 0,1:
- result:=operand_read;
- 2:
- result:=operand_write;
- else
- internalerror(2014011804);
- end;
- end;
- else
- internalerror(2014011805);
- end;
- end
- else
- result:=operation_type_table^[opcode,opnr];
- end;
- function spilling_create_load(const ref:treference;r:tregister):Taicpu;
- var
- tmpref: treference;
- begin
- tmpref:=ref;
- {$ifdef i8086}
- if tmpref.segment=NR_SS then
- tmpref.segment:=NR_NO;
- {$endif i8086}
- case getregtype(r) of
- R_INTREGISTER :
- begin
- if getsubreg(r)=R_SUBH then
- inc(tmpref.offset);
- { we don't need special code here for 32 bit loads on x86_64, since
- those will automatically zero-extend the upper 32 bits. }
- result:=taicpu.op_ref_reg(A_MOV,reg2opsize(r),tmpref,r);
- end;
- R_MMREGISTER :
- if current_settings.fputype in fpu_avx_instructionsets then
- case getsubreg(r) of
- R_SUBMMD:
- result:=taicpu.op_ref_reg(A_VMOVSD,reg2opsize(r),tmpref,r);
- R_SUBMMS:
- result:=taicpu.op_ref_reg(A_VMOVSS,reg2opsize(r),tmpref,r);
- R_SUBQ,
- R_SUBMMWHOLE:
- result:=taicpu.op_ref_reg(A_VMOVQ,S_NO,tmpref,r);
- else
- internalerror(200506043);
- end
- else
- case getsubreg(r) of
- R_SUBMMD:
- result:=taicpu.op_ref_reg(A_MOVSD,reg2opsize(r),tmpref,r);
- R_SUBMMS:
- result:=taicpu.op_ref_reg(A_MOVSS,reg2opsize(r),tmpref,r);
- R_SUBQ,
- R_SUBMMWHOLE:
- result:=taicpu.op_ref_reg(A_MOVQ,S_NO,tmpref,r);
- else
- internalerror(200506043);
- end;
- else
- internalerror(200401041);
- end;
- end;
- function spilling_create_store(r:tregister; const ref:treference):Taicpu;
- var
- size: topsize;
- tmpref: treference;
- begin
- tmpref:=ref;
- {$ifdef i8086}
- if tmpref.segment=NR_SS then
- tmpref.segment:=NR_NO;
- {$endif i8086}
- case getregtype(r) of
- R_INTREGISTER :
- begin
- if getsubreg(r)=R_SUBH then
- inc(tmpref.offset);
- size:=reg2opsize(r);
- {$ifdef x86_64}
- { even if it's a 32 bit reg, we still have to spill 64 bits
- because we often perform 64 bit operations on them }
- if (size=S_L) then
- begin
- size:=S_Q;
- r:=newreg(getregtype(r),getsupreg(r),R_SUBWHOLE);
- end;
- {$endif x86_64}
- result:=taicpu.op_reg_ref(A_MOV,size,r,tmpref);
- end;
- R_MMREGISTER :
- if current_settings.fputype in fpu_avx_instructionsets then
- case getsubreg(r) of
- R_SUBMMD:
- result:=taicpu.op_reg_ref(A_VMOVSD,reg2opsize(r),r,tmpref);
- R_SUBMMS:
- result:=taicpu.op_reg_ref(A_VMOVSS,reg2opsize(r),r,tmpref);
- R_SUBQ,
- R_SUBMMWHOLE:
- result:=taicpu.op_reg_ref(A_VMOVQ,S_NO,r,tmpref);
- else
- internalerror(200506042);
- end
- else
- case getsubreg(r) of
- R_SUBMMD:
- result:=taicpu.op_reg_ref(A_MOVSD,reg2opsize(r),r,tmpref);
- R_SUBMMS:
- result:=taicpu.op_reg_ref(A_MOVSS,reg2opsize(r),r,tmpref);
- R_SUBQ,
- R_SUBMMWHOLE:
- result:=taicpu.op_reg_ref(A_MOVQ,S_NO,r,tmpref);
- else
- internalerror(200506042);
- end;
- else
- internalerror(200401041);
- end;
- end;
- {*****************************************************************************
- Instruction table
- *****************************************************************************}
- procedure BuildInsTabCache;
- var
- i : longint;
- begin
- new(instabcache);
- FillChar(instabcache^,sizeof(tinstabcache),$ff);
- i:=0;
- while (i<InsTabEntries) do
- begin
- if InsTabCache^[InsTab[i].OPcode]=-1 then
- InsTabCache^[InsTab[i].OPcode]:=i;
- inc(i);
- end;
- end;
- procedure BuildInsTabMemRefSizeInfoCache;
- var
- AsmOp: TasmOp;
- i,j: longint;
- insentry : PInsEntry;
- MRefInfo: TMemRefSizeInfo;
- SConstInfo: TConstSizeInfo;
- actRegSize: int64;
- actMemSize: int64;
- actConstSize: int64;
- actRegCount: integer;
- actMemCount: integer;
- actConstCount: integer;
- actRegTypes : int64;
- actRegMemTypes: int64;
- NewRegSize: int64;
- actVMemCount : integer;
- actVMemTypes : int64;
- RegMMXSizeMask: int64;
- RegXMMSizeMask: int64;
- RegYMMSizeMask: int64;
- bitcount: integer;
- function bitcnt(aValue: int64): integer;
- var
- i: integer;
- begin
- result := 0;
- for i := 0 to 63 do
- begin
- if (aValue mod 2) = 1 then
- begin
- inc(result);
- end;
- aValue := aValue shr 1;
- end;
- end;
- begin
- new(InsTabMemRefSizeInfoCache);
- FillChar(InsTabMemRefSizeInfoCache^,sizeof(TInsTabMemRefSizeInfoCache),0);
- for AsmOp := low(TAsmOp) to high(TAsmOp) do
- begin
- i := InsTabCache^[AsmOp];
- if i >= 0 then
- begin
- InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiUnkown;
- InsTabMemRefSizeInfoCache^[AsmOp].ConstSize := csiUnkown;
- InsTabMemRefSizeInfoCache^[AsmOp].ExistsSSEAVX := false;
- insentry:=@instab[i];
- RegMMXSizeMask := 0;
- RegXMMSizeMask := 0;
- RegYMMSizeMask := 0;
- while (insentry^.opcode=AsmOp) do
- begin
- MRefInfo := msiUnkown;
- actRegSize := 0;
- actRegCount := 0;
- actRegTypes := 0;
- NewRegSize := 0;
- actMemSize := 0;
- actMemCount := 0;
- actRegMemTypes := 0;
- actVMemCount := 0;
- actVMemTypes := 0;
- actConstSize := 0;
- actConstCount := 0;
- for j := 0 to insentry^.ops -1 do
- begin
- if ((insentry^.optypes[j] and OT_XMEM32) = OT_XMEM32) OR
- ((insentry^.optypes[j] and OT_XMEM64) = OT_XMEM64) OR
- ((insentry^.optypes[j] and OT_YMEM32) = OT_YMEM32) OR
- ((insentry^.optypes[j] and OT_YMEM64) = OT_YMEM64) then
- begin
- inc(actVMemCount);
- case insentry^.optypes[j] and (OT_XMEM32 OR OT_XMEM64 OR OT_YMEM32 OR OT_YMEM64) of
- OT_XMEM32: actVMemTypes := actVMemTypes or OT_XMEM32;
- OT_XMEM64: actVMemTypes := actVMemTypes or OT_XMEM64;
- OT_YMEM32: actVMemTypes := actVMemTypes or OT_YMEM32;
- OT_YMEM64: actVMemTypes := actVMemTypes or OT_YMEM64;
- else InternalError(777206);
- end;
- end
- else if (insentry^.optypes[j] and OT_REGISTER) = OT_REGISTER then
- begin
- inc(actRegCount);
- NewRegSize := (insentry^.optypes[j] and OT_SIZE_MASK);
- if NewRegSize = 0 then
- begin
- case insentry^.optypes[j] and (OT_MMXREG OR OT_XMMREG OR OT_YMMREG) of
- OT_MMXREG: begin
- NewRegSize := OT_BITS64;
- end;
- OT_XMMREG: begin
- NewRegSize := OT_BITS128;
- InsTabMemRefSizeInfoCache^[AsmOp].ExistsSSEAVX := true;
- end;
- OT_YMMREG: begin
- NewRegSize := OT_BITS256;
- InsTabMemRefSizeInfoCache^[AsmOp].ExistsSSEAVX := true;
- end;
- else NewRegSize := not(0);
- end;
- end;
- actRegSize := actRegSize or NewRegSize;
- actRegTypes := actRegTypes or (insentry^.optypes[j] and (OT_MMXREG OR OT_XMMREG OR OT_YMMREG));
- end
- else if ((insentry^.optypes[j] and OT_MEMORY) <> 0) then
- begin
- inc(actMemCount);
- actMemSize:=actMemSize or (insentry^.optypes[j] and OT_SIZE_MASK);
- if (insentry^.optypes[j] and OT_REGMEM) = OT_REGMEM then
- begin
- actRegMemTypes := actRegMemTypes or insentry^.optypes[j];
- end;
- end
- else if ((insentry^.optypes[j] and OT_IMMEDIATE) = OT_IMMEDIATE) then
- begin
- inc(actConstCount);
- actConstSize := actConstSize or (insentry^.optypes[j] and OT_SIZE_MASK);
- end
- end;
- if actConstCount > 0 then
- begin
- case actConstSize of
- 0: SConstInfo := csiNoSize;
- OT_BITS8: SConstInfo := csiMem8;
- OT_BITS16: SConstInfo := csiMem16;
- OT_BITS32: SConstInfo := csiMem32;
- OT_BITS64: SConstInfo := csiMem64;
- else SConstInfo := csiMultiple;
- end;
- if InsTabMemRefSizeInfoCache^[AsmOp].ConstSize = csiUnkown then
- begin
- InsTabMemRefSizeInfoCache^[AsmOp].ConstSize := SConstInfo;
- end
- else if InsTabMemRefSizeInfoCache^[AsmOp].ConstSize <> SConstInfo then
- begin
- InsTabMemRefSizeInfoCache^[AsmOp].ConstSize := csiMultiple;
- end;
- end;
- if actVMemCount > 0 then
- begin
- if actVMemCount = 1 then
- begin
- if actVMemTypes > 0 then
- begin
- case actVMemTypes of
- OT_XMEM32: MRefInfo := msiXMem32;
- OT_XMEM64: MRefInfo := msiXMem64;
- OT_YMEM32: MRefInfo := msiYMem32;
- OT_YMEM64: MRefInfo := msiYMem64;
- else InternalError(777208);
- end;
- case actRegTypes of
- OT_XMMREG: case MRefInfo of
- msiXMem32,
- msiXMem64: RegXMMSizeMask := RegXMMSizeMask or OT_BITS128;
- msiYMem32,
- msiYMem64: RegXMMSizeMask := RegXMMSizeMask or OT_BITS256;
- else InternalError(777210);
- end;
- OT_YMMREG: case MRefInfo of
- msiXMem32,
- msiXMem64: RegYMMSizeMask := RegYMMSizeMask or OT_BITS128;
- msiYMem32,
- msiYMem64: RegYMMSizeMask := RegYMMSizeMask or OT_BITS256;
- else InternalError(777211);
- end;
- //else InternalError(777209);
- end;
- if InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize = msiUnkown then
- begin
- InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := MRefInfo;
- end
- else if InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize <> MRefInfo then
- begin
- if InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize in [msiXMem32, msiXMem64, msiYMem32, msiYMem64] then
- begin
- InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiVMemMultiple;
- end
- else InternalError(777212);
- end;
- end;
- end
- else InternalError(777207);
- end
- else
- case actMemCount of
- 0: ; // nothing todo
- 1: begin
- MRefInfo := msiUnkown;
- case actRegMemTypes and (OT_MMXRM OR OT_XMMRM OR OT_YMMRM) of
- OT_MMXRM: actMemSize := actMemSize or OT_BITS64;
- OT_XMMRM: actMemSize := actMemSize or OT_BITS128;
- OT_YMMRM: actMemSize := actMemSize or OT_BITS256;
- end;
- case actMemSize of
- 0: MRefInfo := msiNoSize;
- OT_BITS8: MRefInfo := msiMem8;
- OT_BITS16: MRefInfo := msiMem16;
- OT_BITS32: MRefInfo := msiMem32;
- OT_BITS64: MRefInfo := msiMem64;
- OT_BITS128: MRefInfo := msiMem128;
- OT_BITS256: MRefInfo := msiMem256;
- OT_BITS80,
- OT_FAR,
- OT_NEAR,
- OT_SHORT: ; // ignore
- else
- begin
- bitcount := bitcnt(actMemSize);
- if bitcount > 1 then MRefInfo := msiMultiple
- else InternalError(777203);
- end;
- end;
- if InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize = msiUnkown then
- begin
- InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := MRefInfo;
- end
- else if InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize <> MRefInfo then
- begin
- with InsTabMemRefSizeInfoCache^[AsmOp] do
- begin
- if ((MemRefSize = msiMem8) OR (MRefInfo = msiMem8)) then MemRefSize := msiMultiple8
- else if ((MemRefSize = msiMem16) OR (MRefInfo = msiMem16)) then MemRefSize := msiMultiple16
- else if ((MemRefSize = msiMem32) OR (MRefInfo = msiMem32)) then MemRefSize := msiMultiple32
- else if ((MemRefSize = msiMem64) OR (MRefInfo = msiMem64)) then MemRefSize := msiMultiple64
- else if ((MemRefSize = msiMem128) OR (MRefInfo = msiMem128)) then MemRefSize := msiMultiple128
- else if ((MemRefSize = msiMem256) OR (MRefInfo = msiMem256)) then MemRefSize := msiMultiple256
- else MemRefSize := msiMultiple;
- end;
- end;
- if actRegCount > 0 then
- begin
- case actRegTypes and (OT_MMXREG or OT_XMMREG or OT_YMMREG) of
- OT_MMXREG: RegMMXSizeMask := RegMMXSizeMask or actMemSize;
- OT_XMMREG: RegXMMSizeMask := RegXMMSizeMask or actMemSize;
- OT_YMMREG: RegYMMSizeMask := RegYMMSizeMask or actMemSize;
- else begin
- RegMMXSizeMask := not(0);
- RegXMMSizeMask := not(0);
- RegYMMSizeMask := not(0);
- end;
- end;
- end;
- end;
- else InternalError(777202);
- end;
- inc(insentry);
- end;
- if (InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize in MemRefMultiples) and
- (InsTabMemRefSizeInfoCache^[AsmOp].ExistsSSEAVX)then
- begin
- case RegXMMSizeMask of
- OT_BITS16: case RegYMMSizeMask of
- OT_BITS32: InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiMemRegx16y32;
- end;
- OT_BITS32: case RegYMMSizeMask of
- OT_BITS64: InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiMemRegx32y64;
- end;
- OT_BITS64: case RegYMMSizeMask of
- OT_BITS128: InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiMemRegx64y128;
- OT_BITS256: InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiMemRegx64y256;
- end;
- OT_BITS128: begin
- if InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize = msiVMemMultiple then
- begin
- // vector-memory-operand AVX2 (e.g. VGATHER..)
- case RegYMMSizeMask of
- OT_BITS256: InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiVMemRegSize;
- end;
- end
- else if RegMMXSizeMask = 0 then
- begin
- case RegYMMSizeMask of
- OT_BITS128: InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiMemRegx64y128;
- OT_BITS256: InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiMemRegSize;
- end;
- end
- else if RegYMMSizeMask = 0 then
- begin
- case RegMMXSizeMask of
- OT_BITS64: InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiMemRegSize;
- end;
- end
- else InternalError(777205);
- end;
- end;
- end;
- end;
- end;
- for AsmOp := low(TAsmOp) to high(TAsmOp) do
- begin
- // only supported intructiones with SSE- or AVX-operands
- if not(InsTabMemRefSizeInfoCache^[AsmOp].ExistsSSEAVX) then
- begin
- InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiUnkown;
- InsTabMemRefSizeInfoCache^[AsmOp].ConstSize := csiUnkown;
- end;
- end;
- end;
- procedure InitAsm;
- begin
- build_spilling_operation_type_table;
- if not assigned(instabcache) then
- BuildInsTabCache;
- if not assigned(InsTabMemRefSizeInfoCache) then
- BuildInsTabMemRefSizeInfoCache;
- end;
- procedure DoneAsm;
- begin
- if assigned(operation_type_table) then
- begin
- dispose(operation_type_table);
- operation_type_table:=nil;
- end;
- if assigned(instabcache) then
- begin
- dispose(instabcache);
- instabcache:=nil;
- end;
- if assigned(InsTabMemRefSizeInfoCache) then
- begin
- dispose(InsTabMemRefSizeInfoCache);
- InsTabMemRefSizeInfoCache:=nil;
- end;
- end;
- begin
- cai_align:=tai_align;
- cai_cpu:=taicpu;
- end.
|