| 1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152215321542155215621572158215921602161216221632164216521662167216821692170217121722173217421752176217721782179218021812182218321842185218621872188218921902191219221932194219521962197219821992200220122022203220422052206220722082209221022112212221322142215221622172218221922202221222222232224222522262227222822292230223122322233223422352236223722382239224022412242224322442245224622472248224922502251225222532254225522562257225822592260226122622263226422652266226722682269227022712272227322742275227622772278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277727782779278027812782278327842785278627872788278927902791279227932794279527962797279827992800280128022803280428052806280728082809281028112812281328142815281628172818281928202821282228232824282528262827282828292830283128322833283428352836283728382839284028412842284328442845284628472848284928502851285228532854285528562857285828592860286128622863286428652866286728682869287028712872287328742875287628772878287928802881288228832884288528862887288828892890289128922893289428952896289728982899290029012902290329042905290629072908290929102911291229132914291529162917291829192920292129222923292429252926292729282929293029312932293329342935293629372938293929402941294229432944294529462947294829492950295129522953295429552956295729582959296029612962296329642965296629672968296929702971297229732974297529762977297829792980298129822983298429852986298729882989299029912992299329942995299629972998299930003001300230033004300530063007300830093010301130123013301430153016301730183019302030213022302330243025302630273028302930303031303230333034303530363037303830393040304130423043304430453046304730483049305030513052305330543055305630573058305930603061306230633064306530663067306830693070307130723073307430753076307730783079308030813082308330843085308630873088308930903091309230933094309530963097309830993100310131023103310431053106310731083109311031113112311331143115311631173118311931203121312231233124312531263127312831293130313131323133313431353136313731383139314031413142314331443145314631473148314931503151315231533154315531563157315831593160316131623163316431653166316731683169317031713172317331743175317631773178317931803181318231833184318531863187318831893190319131923193319431953196319731983199320032013202320332043205320632073208320932103211321232133214321532163217321832193220322132223223322432253226322732283229323032313232323332343235323632373238323932403241324232433244324532463247324832493250325132523253325432553256325732583259326032613262326332643265326632673268326932703271327232733274 | {    Copyright (c) 1998-2002 by Florian Klaempfl and Peter Vreman    Contains the abstract assembler implementation for the i386    * Portions of this code was inspired by the NASM sources      The Netwide Assembler is Copyright (c) 1996 Simon Tatham and      Julian Hall. All rights reserved.    This program is free software; you can redistribute it and/or modify    it under the terms of the GNU General Public License as published by    the Free Software Foundation; either version 2 of the License, or    (at your option) any later version.    This program is distributed in the hope that it will be useful,    but WITHOUT ANY WARRANTY; without even the implied warranty of    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the    GNU General Public License for more details.    You should have received a copy of the GNU General Public License    along with this program; if not, write to the Free Software    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. ****************************************************************************}unit aasmcpu;{$i fpcdefs.inc}interface    uses      globtype,verbose,      cpubase,      cgbase,cgutils,      symtype,      aasmbase,aasmtai,aasmdata,aasmsym,      ogbase;    const      { "mov reg,reg" source operand number }      O_MOV_SOURCE = 0;      { "mov reg,reg" destination operand number }      O_MOV_DEST = 1;    { Operand types }      OT_NONE      = $00000000;      { Bits 0..7: sizes }      OT_BITS8     = $00000001;      OT_BITS16    = $00000002;      OT_BITS32    = $00000004;      OT_BITS64    = $00000008;  { x86_64 and FPU }      OT_BITS128   = $10000000;  { 16 byte SSE }      OT_BITS256   = $20000000;  { 32 byte AVX }      OT_BITS80    = $00000010;  { FPU only  }      OT_FAR       = $00000020;  { this means 16:16 or 16:32, like in CALL/JMP }      OT_NEAR      = $00000040;      OT_SHORT     = $00000080;      { TODO: FAR/NEAR/SHORT are sizes too, they should be included into size mask,        but this requires adjusting the opcode table }      OT_SIZE_MASK = $3000001F;  { all the size attributes  }      OT_NON_SIZE  = longint(not OT_SIZE_MASK);      { Bits 8..11: modifiers }      OT_SIGNED    = $00000100;  { the operand need to be signed -128-127 }      OT_TO        = $00000200;  { reverse effect in FADD, FSUB &c  }      OT_COLON     = $00000400;  { operand is followed by a colon  }      OT_MODIFIER_MASK = $00000F00;      { Bits 12..15: type of operand }      OT_REGISTER  = $00001000;      OT_IMMEDIATE = $00002000;      OT_MEMORY    = $0000C000;  { always includes 'OT_REGMEM' bit as well }      OT_REGMEM    = $00008000;  { for r/m, ie EA, operands  }      OT_TYPE_MASK = OT_REGISTER or OT_IMMEDIATE or OT_MEMORY or OT_REGMEM;      OT_REGNORM   = OT_REGISTER or OT_REGMEM;  { 'normal' reg, qualifies as EA  }      { Bits 20..22, 24..26: register classes        otf_* consts are not used alone, only to build other constants. }      otf_reg_cdt  = $00100000;      otf_reg_gpr  = $00200000;      otf_reg_sreg = $00400000;      otf_reg_fpu  = $01000000;      otf_reg_mmx  = $02000000;      otf_reg_xmm  = $04000000;      otf_reg_ymm  = $08000000;      { Bits 16..19: subclasses, meaning depends on classes field }      otf_sub0     = $00010000;      otf_sub1     = $00020000;      otf_sub2     = $00040000;      otf_sub3     = $00080000;      OT_REG_SMASK = otf_sub0 or otf_sub1 or otf_sub2 or otf_sub3;      OT_REG_TYPMASK = otf_reg_cdt or otf_reg_gpr or otf_reg_sreg or otf_reg_fpu or otf_reg_mmx or otf_reg_xmm or otf_reg_ymm;      { register class 0: CRx, DRx and TRx }{$ifdef x86_64}      OT_REG_CDT   = OT_REGISTER or otf_reg_cdt or OT_BITS64;{$else x86_64}      OT_REG_CDT   = OT_REGISTER or otf_reg_cdt or OT_BITS32;{$endif x86_64}      OT_REG_CREG  = OT_REG_CDT or otf_sub0;  { CRn  }      OT_REG_DREG  = OT_REG_CDT or otf_sub1;  { DRn  }      OT_REG_TREG  = OT_REG_CDT or otf_sub2;  { TRn  }      OT_REG_CR4   = OT_REG_CDT or otf_sub3;  { CR4 (Pentium only)  }      { register class 1: general-purpose registers }      OT_REG_GPR   = OT_REGNORM or otf_reg_gpr;      OT_RM_GPR    = OT_REGMEM or otf_reg_gpr;      OT_REG8      = OT_REG_GPR or OT_BITS8;  { 8-bit GPR }      OT_REG16     = OT_REG_GPR or OT_BITS16;      OT_REG32     = OT_REG_GPR or OT_BITS32;      OT_REG64     = OT_REG_GPR or OT_BITS64;      { GPR subclass 0: accumulator: AL, AX, EAX or RAX }      OT_REG_ACCUM = OT_REG_GPR or otf_sub0;      OT_REG_AL    = OT_REG_ACCUM or OT_BITS8;      OT_REG_AX    = OT_REG_ACCUM or OT_BITS16;      OT_REG_EAX   = OT_REG_ACCUM or OT_BITS32;{$ifdef x86_64}      OT_REG_RAX   = OT_REG_ACCUM or OT_BITS64;{$endif x86_64}      { GPR subclass 1: counter: CL, CX, ECX or RCX }      OT_REG_COUNT = OT_REG_GPR or otf_sub1;      OT_REG_CL    = OT_REG_COUNT or OT_BITS8;      OT_REG_CX    = OT_REG_COUNT or OT_BITS16;      OT_REG_ECX   = OT_REG_COUNT or OT_BITS32;{$ifdef x86_64}      OT_REG_RCX   = OT_REG_COUNT or OT_BITS64;{$endif x86_64}      { GPR subclass 2: data register: DL, DX, EDX or RDX }      OT_REG_DX    = OT_REG_GPR or otf_sub2 or OT_BITS16;      OT_REG_EDX   = OT_REG_GPR or otf_sub2 or OT_BITS32;      { register class 2: Segment registers }      OT_REG_SREG  = OT_REGISTER or otf_reg_sreg or OT_BITS16;      OT_REG_CS    = OT_REG_SREG or otf_sub0;  { CS  }      OT_REG_DESS  = OT_REG_SREG or otf_sub1;  { DS, ES, SS (non-CS 86 registers)  }      OT_REG_FSGS  = OT_REG_SREG or otf_sub2;  { FS, GS (386 extended registers)  }      { register class 3: FPU registers }      OT_FPUREG    = OT_REGISTER or otf_reg_fpu;      OT_FPU0      = OT_FPUREG or otf_sub0;    { FPU stack register zero  }      { register class 4: MMX (both reg and r/m) }      OT_MMXREG    = OT_REGNORM or otf_reg_mmx;      OT_MMXRM     = OT_REGMEM or otf_reg_mmx;      { register class 5: XMM (both reg and r/m) }      OT_XMMREG    = OT_REGNORM or otf_reg_xmm;      OT_XMMRM     = OT_REGMEM or otf_reg_xmm;      { register class 5: XMM (both reg and r/m) }      OT_YMMREG    = OT_REGNORM or otf_reg_ymm;      OT_YMMRM     = OT_REGMEM or otf_reg_ymm;      { Memory operands }      OT_MEM8      = OT_MEMORY or OT_BITS8;      OT_MEM16     = OT_MEMORY or OT_BITS16;      OT_MEM32     = OT_MEMORY or OT_BITS32;      OT_MEM64     = OT_MEMORY or OT_BITS64;      OT_MEM128    = OT_MEMORY or OT_BITS128;      OT_MEM256    = OT_MEMORY or OT_BITS256;      OT_MEM80     = OT_MEMORY or OT_BITS80;      OT_MEM_OFFS  = OT_MEMORY or otf_sub0;  { special type of EA  }                                             { simple [address] offset  }      { Matches any type of r/m operand }      OT_MEMORY_ANY = OT_MEMORY or OT_RM_GPR or OT_XMMRM or OT_MMXRM or OT_YMMRM;      { Immediate operands }      OT_IMM8      = OT_IMMEDIATE or OT_BITS8;      OT_IMM16     = OT_IMMEDIATE or OT_BITS16;      OT_IMM32     = OT_IMMEDIATE or OT_BITS32;      OT_IMM64     = OT_IMMEDIATE or OT_BITS64;      OT_ONENESS   = otf_sub0;  { special type of immediate operand  }      OT_UNITY     = OT_IMMEDIATE or OT_ONENESS;  { for shift/rotate instructions  }      { Size of the instruction table converted by nasmconv.pas }{$ifdef x86_64}      instabentries = {$i x8664nop.inc}{$else x86_64}      instabentries = {$i i386nop.inc}{$endif x86_64}      maxinfolen    = 8;      MaxInsChanges = 3; { Max things a instruction can change }    type      { What an instruction can change. Needed for optimizer and spilling code.        Note: The order of this enumeration is should not be changed! }      TInsChange = (Ch_None,        {Read from a register}        Ch_REAX, Ch_RECX, Ch_REDX, Ch_REBX, Ch_RESP, Ch_REBP, Ch_RESI, Ch_REDI,        {write from a register}        Ch_WEAX, Ch_WECX, Ch_WEDX, Ch_WEBX, Ch_WESP, Ch_WEBP, Ch_WESI, Ch_WEDI,        {read and write from/to a register}        Ch_RWEAX, Ch_RWECX, Ch_RWEDX, Ch_RWEBX, Ch_RWESP, Ch_RWEBP, Ch_RWESI, Ch_RWEDI,        {modify the contents of a register with the purpose of using         this changed content afterwards (add/sub/..., but e.g. not rep         or movsd)}        Ch_MEAX, Ch_MECX, Ch_MEDX, Ch_MEBX, Ch_MESP, Ch_MEBP, Ch_MESI, Ch_MEDI,        Ch_CDirFlag {clear direction flag}, Ch_SDirFlag {set dir flag},        Ch_RFlags, Ch_WFlags, Ch_RWFlags, Ch_FPU,        Ch_Rop1, Ch_Wop1, Ch_RWop1,Ch_Mop1,        Ch_Rop2, Ch_Wop2, Ch_RWop2,Ch_Mop2,        Ch_Rop3, Ch_WOp3, Ch_RWOp3,Ch_Mop3,        Ch_WMemEDI,        Ch_All,        { x86_64 registers }        Ch_RRAX, Ch_RRCX, Ch_RRDX, Ch_RRBX, Ch_RRSP, Ch_RRBP, Ch_RRSI, Ch_RRDI,        Ch_WRAX, Ch_WRCX, Ch_WRDX, Ch_WRBX, Ch_WRSP, Ch_WRBP, Ch_WRSI, Ch_WRDI,        Ch_RWRAX, Ch_RWRCX, Ch_RWRDX, Ch_RWRBX, Ch_RWRSP, Ch_RWRBP, Ch_RWRSI, Ch_RWRDI,        Ch_MRAX, Ch_MRCX, Ch_MRDX, Ch_MRBX, Ch_MRSP, Ch_MRBP, Ch_MRSI, Ch_MRDI      );      TInsProp = packed record        Ch : Array[1..MaxInsChanges] of TInsChange;      end;      TMemRefSizeInfo = (msiUnkown, msiUnsupported, msiNoSize,                         msiMultiple, msiMultiple8, msiMultiple16, msiMultiple32,                         msiMultiple64, msiMultiple128, msiMultiple256,                         msiMemRegSize, msiMemRegx64y128, msiMemRegx64y256,                         msiMem8, msiMem16, msiMem32, msiMem64, msiMem128, msiMem256);      TConstSizeInfo  = (csiUnkown, csiMultiple, csiNoSize, csiMem8, csiMem16, csiMem32, csiMem64);      TInsTabMemRefSizeInfoRec = record        MemRefSize  : TMemRefSizeInfo;        ExistsSSEAVX: boolean;        ConstSize   : TConstSizeInfo;      end;    const      MemRefMultiples: set of TMemRefSizeInfo = [msiMultiple, msiMultiple8,                                                 msiMultiple16, msiMultiple32,                                                 msiMultiple64, msiMultiple128,                                                 msiMultiple256];      InsProp : array[tasmop] of TInsProp ={$ifdef x86_64}        {$i x8664pro.inc}{$else x86_64}        {$i i386prop.inc}{$endif x86_64}    type      TOperandOrder = (op_intel,op_att);      tinsentry=packed record        opcode  : tasmop;        ops     : byte;        optypes : array[0..max_operands-1] of longint;        code    : array[0..maxinfolen] of char;        flags   : int64;      end;      pinsentry=^tinsentry;      { alignment for operator }      tai_align = class(tai_align_abstract)         reg       : tregister;         constructor create(b:byte);override;         constructor create_op(b: byte; _op: byte);override;         function calculatefillbuf(var buf : tfillbuffer;executable : boolean):pchar;override;      end;      taicpu = class(tai_cpu_abstract_sym)         opsize    : topsize;         constructor op_none(op : tasmop);         constructor op_none(op : tasmop;_size : topsize);         constructor op_reg(op : tasmop;_size : topsize;_op1 : tregister);         constructor op_const(op : tasmop;_size : topsize;_op1 : aint);         constructor op_ref(op : tasmop;_size : topsize;const _op1 : treference);         constructor op_reg_reg(op : tasmop;_size : topsize;_op1,_op2 : tregister);         constructor op_reg_ref(op : tasmop;_size : topsize;_op1 : tregister;const _op2 : treference);         constructor op_reg_const(op:tasmop; _size: topsize; _op1: tregister; _op2: aint);         constructor op_const_reg(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister);         constructor op_const_const(op : tasmop;_size : topsize;_op1,_op2 : aint);         constructor op_const_ref(op : tasmop;_size : topsize;_op1 : aint;const _op2 : treference);         constructor op_ref_reg(op : tasmop;_size : topsize;const _op1 : treference;_op2 : tregister);         constructor op_reg_reg_reg(op : tasmop;_size : topsize;_op1,_op2,_op3 : tregister);         constructor op_const_reg_reg(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister;_op3 : tregister);         constructor op_const_ref_reg(op : tasmop;_size : topsize;_op1 : aint;const _op2 : treference;_op3 : tregister);         constructor op_reg_reg_ref(op : tasmop;_size : topsize;_op1,_op2 : tregister; const _op3 : treference);         constructor op_const_reg_ref(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister;const _op3 : treference);         { this is for Jmp instructions }         constructor op_cond_sym(op : tasmop;cond:TAsmCond;_size : topsize;_op1 : tasmsymbol);         constructor op_sym(op : tasmop;_size : topsize;_op1 : tasmsymbol);         constructor op_sym_ofs(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint);         constructor op_sym_ofs_reg(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint;_op2 : tregister);         constructor op_sym_ofs_ref(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint;const _op2 : treference);         procedure changeopsize(siz:topsize);         function  GetString:string;         procedure CheckNonCommutativeOpcodes;      private         FOperandOrder : TOperandOrder;         procedure init(_size : topsize); { this need to be called by all constructor }      public         { the next will reset all instructions that can change in pass 2 }         procedure ResetPass1;override;         procedure ResetPass2;override;         function  CheckIfValid:boolean;         function  Pass1(objdata:TObjData):longint;override;         procedure Pass2(objdata:TObjData);override;         procedure SetOperandOrder(order:TOperandOrder);         function is_same_reg_move(regtype: Tregistertype):boolean;override;         { register spilling code }         function spilling_get_operation_type(opnr: longint): topertype;override;      private         { next fields are filled in pass1, so pass2 is faster }         insentry  : PInsEntry;         insoffset : longint;         LastInsOffset : longint; { need to be public to be reset }         inssize   : shortint;{$ifdef x86_64}         rex       : byte;{$endif x86_64}         function  InsEnd:longint;         procedure create_ot(objdata:TObjData);         function  Matches(p:PInsEntry):boolean;         function  calcsize(p:PInsEntry):shortint;         procedure gencode(objdata:TObjData);         function  NeedAddrPrefix(opidx:byte):boolean;         procedure Swapoperands;         function  FindInsentry(objdata:TObjData):boolean;      end;    function spilling_create_load(const ref:treference;r:tregister):Taicpu;    function spilling_create_store(r:tregister; const ref:treference):Taicpu;    function MemRefInfo(aAsmop: TAsmOp): TInsTabMemRefSizeInfoRec;    procedure InitAsm;    procedure DoneAsm;implementation     uses       cutils,       globals,       systems,       procinfo,       itcpugas,       symsym;{*****************************************************************************                              Instruction table*****************************************************************************}    const     {Instruction flags }       IF_NONE   = $00000000;       IF_SM     = $00000001;  { size match first two operands  }       IF_SM2    = $00000002;       IF_SB     = $00000004;  { unsized operands can't be non-byte  }       IF_SW     = $00000008;  { unsized operands can't be non-word  }       IF_SD     = $00000010;  { unsized operands can't be nondword  }       IF_SMASK  = $0000001f;       IF_AR0    = $00000020;  { SB, SW, SD applies to argument 0  }       IF_AR1    = $00000040;  { SB, SW, SD applies to argument 1  }       IF_AR2    = $00000060;  { SB, SW, SD applies to argument 2  }       IF_ARMASK = $00000060;  { mask for unsized argument spec  }       IF_ARSHIFT = 5;         { LSB of IF_ARMASK }       IF_PRIV   = $00000100;  { it's a privileged instruction  }       IF_SMM    = $00000200;  { it's only valid in SMM  }       IF_PROT   = $00000400;  { it's protected mode only  }       IF_NOX86_64 = $00000800;  { removed instruction in x86_64  }       IF_UNDOC  = $00001000;  { it's an undocumented instruction  }       IF_FPU    = $00002000;  { it's an FPU instruction  }       IF_MMX    = $00004000;  { it's an MMX instruction  }       { it's a 3DNow! instruction  }       IF_3DNOW  = $00008000;       { it's a SSE (KNI, MMX2) instruction  }       IF_SSE    = $00010000;       { SSE2 instructions  }       IF_SSE2   = $00020000;       { SSE3 instructions  }       IF_SSE3   = $00040000;       { SSE64 instructions  }       IF_SSE64  = $00080000;       { the mask for processor types  }       {IF_PMASK  = longint($FF000000);}       { the mask for disassembly "prefer"  }       {IF_PFMASK = longint($F001FF00);}       { SVM instructions  }       IF_SVM    = $00100000;       { SSE4 instructions  }       IF_SSE4   = $00200000;       { TODO: These flags were added to make x86ins.dat more readable.         Values must be reassigned to make any other use of them. }       IF_SSSE3  = $00200000;       IF_SSE41  = $00200000;       IF_SSE42  = $00200000;       IF_AVX    = $00200000;       IF_SANDYBRIDGE = $00200000;       IF_8086   = $00000000;  { 8086 instruction  }       IF_186    = $01000000;  { 186+ instruction  }       IF_286    = $02000000;  { 286+ instruction  }       IF_386    = $03000000;  { 386+ instruction  }       IF_486    = $04000000;  { 486+ instruction  }       IF_PENT   = $05000000;  { Pentium instruction  }       IF_P6     = $06000000;  { P6 instruction  }       IF_KATMAI = $07000000;  { Katmai instructions  }       { Willamette instructions }       IF_WILLAMETTE = $08000000;       { Prescott instructions }       IF_PRESCOTT = $09000000;       IF_X86_64 = $0a000000;       IF_CYRIX  = $0b000000;  { Cyrix-specific instruction  }       IF_AMD    = $0c000000;  { AMD-specific instruction  }       IF_CENTAUR = $0d000000;  { centaur-specific instruction  }       { added flags }       IF_PRE    = $40000000;  { it's a prefix instruction }       IF_PASS2  = $80000000;  { if the instruction can change in a second pass }     type       TInsTabCache=array[TasmOp] of longint;       PInsTabCache=^TInsTabCache;       TInsTabMemRefSizeInfoCache=array[TasmOp] of TInsTabMemRefSizeInfoRec;       PInsTabMemRefSizeInfoCache=^TInsTabMemRefSizeInfoCache;     const{$ifdef x86_64}       InsTab:array[0..instabentries-1] of TInsEntry={$i x8664tab.inc}{$else x86_64}       InsTab:array[0..instabentries-1] of TInsEntry={$i i386tab.inc}{$endif x86_64}     var       InsTabCache : PInsTabCache;       InsTabMemRefSizeInfoCache: PInsTabMemRefSizeInfoCache;     const{$ifdef x86_64}       { Intel style operands ! }       opsize_2_type:array[0..2,topsize] of longint=(         (OT_NONE,          OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS16,OT_BITS32,OT_BITS32,OT_BITS64,OT_BITS64,OT_BITS64,          OT_BITS16,OT_BITS32,OT_BITS64,          OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,          OT_BITS64,          OT_NEAR,OT_FAR,OT_SHORT,          OT_NONE,          OT_BITS128,          OT_BITS256         ),         (OT_NONE,          OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS8,OT_BITS8,OT_BITS16,OT_BITS8,OT_BITS16,OT_BITS32,          OT_BITS16,OT_BITS32,OT_BITS64,          OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,          OT_BITS64,          OT_NEAR,OT_FAR,OT_SHORT,          OT_NONE,          OT_BITS128,          OT_BITS256         ),         (OT_NONE,          OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_NONE,OT_NONE,OT_NONE,OT_NONE,OT_NONE,OT_NONE,          OT_BITS16,OT_BITS32,OT_BITS64,          OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,          OT_BITS64,          OT_NEAR,OT_FAR,OT_SHORT,          OT_NONE,          OT_BITS128,          OT_BITS256         )       );      reg_ot_table : array[tregisterindex] of longint = (        {$i r8664ot.inc}      );{$else x86_64}       { Intel style operands ! }       opsize_2_type:array[0..2,topsize] of longint=(         (OT_NONE,          OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS16,OT_BITS32,OT_BITS32,          OT_BITS16,OT_BITS32,OT_BITS64,          OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,          OT_BITS64,          OT_NEAR,OT_FAR,OT_SHORT,          OT_NONE,          OT_BITS128,          OT_BITS256         ),         (OT_NONE,          OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS8,OT_BITS8,OT_BITS16,          OT_BITS16,OT_BITS32,OT_BITS64,          OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,          OT_BITS64,          OT_NEAR,OT_FAR,OT_SHORT,          OT_NONE,          OT_BITS128,          OT_BITS256         ),         (OT_NONE,          OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_NONE,OT_NONE,OT_NONE,          OT_BITS16,OT_BITS32,OT_BITS64,          OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,          OT_BITS64,          OT_NEAR,OT_FAR,OT_SHORT,          OT_NONE,          OT_BITS128,          OT_BITS256         )      );      reg_ot_table : array[tregisterindex] of longint = (        {$i r386ot.inc}      );{$endif x86_64}    function MemRefInfo(aAsmop: TAsmOp): TInsTabMemRefSizeInfoRec;    begin      result := InsTabMemRefSizeInfoCache^[aAsmop];    end;    { Operation type for spilling code }    type      toperation_type_table=array[tasmop,0..Max_Operands] of topertype;    var      operation_type_table : ^toperation_type_table;{****************************************************************************                              TAI_ALIGN ****************************************************************************}    constructor tai_align.create(b: byte);      begin        inherited create(b);        reg:=NR_ECX;      end;    constructor tai_align.create_op(b: byte; _op: byte);      begin        inherited create_op(b,_op);        reg:=NR_NO;      end;    function tai_align.calculatefillbuf(var buf : tfillbuffer;executable : boolean):pchar;      const{$ifdef x86_64}        alignarray:array[0..3] of string[4]=(          #$66#$66#$66#$90,          #$66#$66#$90,          #$66#$90,          #$90        );{$else x86_64}        alignarray:array[0..5] of string[8]=(          #$8D#$B4#$26#$00#$00#$00#$00,          #$8D#$B6#$00#$00#$00#$00,          #$8D#$74#$26#$00,          #$8D#$76#$00,          #$89#$F6,          #$90);{$endif x86_64}      var        bufptr : pchar;        j : longint;        localsize: byte;      begin        inherited calculatefillbuf(buf,executable);        if not(use_op) and executable then         begin           bufptr:=pchar(@buf);           { fillsize may still be used afterwards, so don't modify }           { e.g. writebytes(hp.calculatefillbuf(buf)^,hp.fillsize) }           localsize:=fillsize;           while (localsize>0) do            begin              for j:=low(alignarray) to high(alignarray) do               if (localsize>=length(alignarray[j])) then                break;              move(alignarray[j][1],bufptr^,length(alignarray[j]));              inc(bufptr,length(alignarray[j]));              dec(localsize,length(alignarray[j]));            end;         end;        calculatefillbuf:=pchar(@buf);      end;{*****************************************************************************                                 Taicpu Constructors*****************************************************************************}    procedure taicpu.changeopsize(siz:topsize);      begin        opsize:=siz;      end;    procedure taicpu.init(_size : topsize);      begin         { default order is att }         FOperandOrder:=op_att;         segprefix:=NR_NO;         opsize:=_size;         insentry:=nil;         LastInsOffset:=-1;         InsOffset:=0;         InsSize:=0;      end;    constructor taicpu.op_none(op : tasmop);      begin         inherited create(op);         init(S_NO);      end;    constructor taicpu.op_none(op : tasmop;_size : topsize);      begin         inherited create(op);         init(_size);      end;    constructor taicpu.op_reg(op : tasmop;_size : topsize;_op1 : tregister);      begin         inherited create(op);         init(_size);         ops:=1;         loadreg(0,_op1);      end;    constructor taicpu.op_const(op : tasmop;_size : topsize;_op1 : aint);      begin         inherited create(op);         init(_size);         ops:=1;         loadconst(0,_op1);      end;    constructor taicpu.op_ref(op : tasmop;_size : topsize;const _op1 : treference);      begin         inherited create(op);         init(_size);         ops:=1;         loadref(0,_op1);      end;    constructor taicpu.op_reg_reg(op : tasmop;_size : topsize;_op1,_op2 : tregister);      begin         inherited create(op);         init(_size);         ops:=2;         loadreg(0,_op1);         loadreg(1,_op2);      end;    constructor taicpu.op_reg_const(op:tasmop; _size: topsize; _op1: tregister; _op2: aint);      begin         inherited create(op);         init(_size);         ops:=2;         loadreg(0,_op1);         loadconst(1,_op2);      end;    constructor taicpu.op_reg_ref(op : tasmop;_size : topsize;_op1 : tregister;const _op2 : treference);      begin         inherited create(op);         init(_size);         ops:=2;         loadreg(0,_op1);         loadref(1,_op2);      end;    constructor taicpu.op_const_reg(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister);      begin         inherited create(op);         init(_size);         ops:=2;         loadconst(0,_op1);         loadreg(1,_op2);      end;    constructor taicpu.op_const_const(op : tasmop;_size : topsize;_op1,_op2 : aint);      begin         inherited create(op);         init(_size);         ops:=2;         loadconst(0,_op1);         loadconst(1,_op2);      end;    constructor taicpu.op_const_ref(op : tasmop;_size : topsize;_op1 : aint;const _op2 : treference);      begin         inherited create(op);         init(_size);         ops:=2;         loadconst(0,_op1);         loadref(1,_op2);      end;    constructor taicpu.op_ref_reg(op : tasmop;_size : topsize;const _op1 : treference;_op2 : tregister);      begin         inherited create(op);         init(_size);         ops:=2;         loadref(0,_op1);         loadreg(1,_op2);      end;    constructor taicpu.op_reg_reg_reg(op : tasmop;_size : topsize;_op1,_op2,_op3 : tregister);      begin         inherited create(op);         init(_size);         ops:=3;         loadreg(0,_op1);         loadreg(1,_op2);         loadreg(2,_op3);      end;    constructor taicpu.op_const_reg_reg(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister;_op3 : tregister);      begin         inherited create(op);         init(_size);         ops:=3;         loadconst(0,_op1);         loadreg(1,_op2);         loadreg(2,_op3);      end;    constructor taicpu.op_reg_reg_ref(op : tasmop;_size : topsize;_op1,_op2 : tregister;const _op3 : treference);      begin         inherited create(op);         init(_size);         ops:=3;         loadreg(0,_op1);         loadreg(1,_op2);         loadref(2,_op3);      end;    constructor taicpu.op_const_ref_reg(op : tasmop;_size : topsize;_op1 : aint;const _op2 : treference;_op3 : tregister);      begin         inherited create(op);         init(_size);         ops:=3;         loadconst(0,_op1);         loadref(1,_op2);         loadreg(2,_op3);      end;    constructor taicpu.op_const_reg_ref(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister;const _op3 : treference);      begin         inherited create(op);         init(_size);         ops:=3;         loadconst(0,_op1);         loadreg(1,_op2);         loadref(2,_op3);      end;    constructor taicpu.op_cond_sym(op : tasmop;cond:TAsmCond;_size : topsize;_op1 : tasmsymbol);      begin         inherited create(op);         init(_size);         condition:=cond;         ops:=1;         loadsymbol(0,_op1,0);      end;    constructor taicpu.op_sym(op : tasmop;_size : topsize;_op1 : tasmsymbol);      begin         inherited create(op);         init(_size);         ops:=1;         loadsymbol(0,_op1,0);      end;    constructor taicpu.op_sym_ofs(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint);      begin         inherited create(op);         init(_size);         ops:=1;         loadsymbol(0,_op1,_op1ofs);      end;    constructor taicpu.op_sym_ofs_reg(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint;_op2 : tregister);      begin         inherited create(op);         init(_size);         ops:=2;         loadsymbol(0,_op1,_op1ofs);         loadreg(1,_op2);      end;    constructor taicpu.op_sym_ofs_ref(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint;const _op2 : treference);      begin         inherited create(op);         init(_size);         ops:=2;         loadsymbol(0,_op1,_op1ofs);         loadref(1,_op2);      end;    function taicpu.GetString:string;      var        i : longint;        s : string;        addsize : boolean;      begin        s:='['+std_op2str[opcode];        for i:=0 to ops-1 do         begin           with oper[i]^ do             begin               if i=0 then                s:=s+' '               else                s:=s+',';               { type }               addsize:=false;               if (ot and OT_XMMREG)=OT_XMMREG then                s:=s+'xmmreg'               else                 if (ot and OT_YMMREG)=OT_YMMREG then                  s:=s+'ymmreg'               else                 if (ot and OT_MMXREG)=OT_MMXREG then                  s:=s+'mmxreg'               else                 if (ot and OT_FPUREG)=OT_FPUREG then                  s:=s+'fpureg'               else                if (ot and OT_REGISTER)=OT_REGISTER then                 begin                   s:=s+'reg';                   addsize:=true;                 end               else                if (ot and OT_IMMEDIATE)=OT_IMMEDIATE then                 begin                   s:=s+'imm';                   addsize:=true;                 end               else                if (ot and OT_MEMORY)=OT_MEMORY then                 begin                   s:=s+'mem';                   addsize:=true;                 end               else                 s:=s+'???';               { size }               if addsize then                begin                  if (ot and OT_BITS8)<>0 then                    s:=s+'8'                  else                   if (ot and OT_BITS16)<>0 then                    s:=s+'16'                  else                   if (ot and OT_BITS32)<>0 then                    s:=s+'32'                  else                   if (ot and OT_BITS64)<>0 then                    s:=s+'64'                  else                   if (ot and OT_BITS128)<>0 then                    s:=s+'128'                  else                   if (ot and OT_BITS256)<>0 then                    s:=s+'256'                  else                    s:=s+'??';                  { signed }                  if (ot and OT_SIGNED)<>0 then                   s:=s+'s';                end;             end;         end;        GetString:=s+']';      end;    procedure taicpu.Swapoperands;      var        p : POper;      begin        { Fix the operands which are in AT&T style and we need them in Intel style }        case ops of          0,1:            ;          2 : begin                { 0,1 -> 1,0 }                p:=oper[0];                oper[0]:=oper[1];                oper[1]:=p;              end;          3 : begin                { 0,1,2 -> 2,1,0 }                p:=oper[0];                oper[0]:=oper[2];                oper[2]:=p;              end;          4 : begin                { 0,1,2,3 -> 3,2,1,0 }                p:=oper[0];                oper[0]:=oper[3];                oper[3]:=p;                p:=oper[1];                oper[1]:=oper[2];                oper[2]:=p;              end;          else            internalerror(201108141);        end;      end;    procedure taicpu.SetOperandOrder(order:TOperandOrder);      begin        if FOperandOrder<>order then         begin           Swapoperands;           FOperandOrder:=order;         end;      end;    procedure taicpu.CheckNonCommutativeOpcodes;      begin        { we need ATT order }        SetOperandOrder(op_att);        if (            (ops=2) and            (oper[0]^.typ=top_reg) and            (oper[1]^.typ=top_reg) and           { if the first is ST and the second is also a register             it is necessarily ST1 .. ST7 }            ((oper[0]^.reg=NR_ST) or             (oper[0]^.reg=NR_ST0))           ) or           { ((ops=1) and            (oper[0]^.typ=top_reg) and            (oper[0]^.reg in [R_ST1..R_ST7]))  or}           (ops=0) then          begin            if opcode=A_FSUBR then              opcode:=A_FSUB            else if opcode=A_FSUB then              opcode:=A_FSUBR            else if opcode=A_FDIVR then              opcode:=A_FDIV            else if opcode=A_FDIV then              opcode:=A_FDIVR            else if opcode=A_FSUBRP then              opcode:=A_FSUBP            else if opcode=A_FSUBP then              opcode:=A_FSUBRP            else if opcode=A_FDIVRP then              opcode:=A_FDIVP            else if opcode=A_FDIVP then              opcode:=A_FDIVRP;          end;        if (            (ops=1) and            (oper[0]^.typ=top_reg) and            (getregtype(oper[0]^.reg)=R_FPUREGISTER) and            (oper[0]^.reg<>NR_ST)           ) then         begin           if opcode=A_FSUBRP then             opcode:=A_FSUBP           else if opcode=A_FSUBP then             opcode:=A_FSUBRP           else if opcode=A_FDIVRP then             opcode:=A_FDIVP           else if opcode=A_FDIVP then             opcode:=A_FDIVRP;         end;      end;{*****************************************************************************                                Assembler*****************************************************************************}    type      ea = packed record        sib_present : boolean;        bytes : byte;        size  : byte;        modrm : byte;        sib   : byte;{$ifdef x86_64}        rex   : byte;{$endif x86_64}      end;    procedure taicpu.create_ot(objdata:TObjData);      {        this function will also fix some other fields which only needs to be once      }      var        i,l,relsize : longint;        currsym : TObjSymbol;      begin        if ops=0 then         exit;        { update oper[].ot field }        for i:=0 to ops-1 do         with oper[i]^ do          begin            case typ of              top_reg :                begin                  ot:=reg_ot_table[findreg_by_number(reg)];                end;              top_ref :                begin                  if (ref^.refaddr=addr_no){$ifdef i386}                     or (                         (ref^.refaddr in [addr_pic]) and                         { allow any base for assembler blocks }                        ((assigned(current_procinfo) and                         (pi_has_assembler_block in current_procinfo.flags) and                         (ref^.base<>NR_NO)) or (ref^.base=NR_EBX))                        ){$endif i386}{$ifdef x86_64}                     or (                         (ref^.refaddr in [addr_pic,addr_pic_no_got]) and                         (ref^.base<>NR_NO)                        ){$endif x86_64}                     then                    begin                      { create ot field }                      if (ot and OT_SIZE_MASK)=0 then                        ot:=OT_MEMORY_ANY or opsize_2_type[i,opsize]                      else                        ot:=OT_MEMORY_ANY or (ot and OT_SIZE_MASK);                      if (ref^.base=NR_NO) and (ref^.index=NR_NO) then                        ot:=ot or OT_MEM_OFFS;                      { fix scalefactor }                      if (ref^.index=NR_NO) then                       ref^.scalefactor:=0                      else                       if (ref^.scalefactor=0) then                        ref^.scalefactor:=1;                    end                  else                    begin                      { Jumps use a relative offset which can be 8bit,                        for other opcodes we always need to generate the full                        32bit address }                      if assigned(objdata) and                         is_jmp then                        begin                          currsym:=objdata.symbolref(ref^.symbol);                          l:=ref^.offset;{$push}{$r-}                          if assigned(currsym) then                            inc(l,currsym.address);{$pop}                          { when it is a forward jump we need to compensate the                            offset of the instruction since the previous time,                            because the symbol address is then still using the                            'old-style' addressing.                            For backwards jumps this is not required because the                            address of the symbol is already adjusted to the                            new offset }                          if (l>InsOffset) and (LastInsOffset<>-1) then                            inc(l,InsOffset-LastInsOffset);                          { instruction size will then always become 2 (PFV) }                          relsize:=(InsOffset+2)-l;                          if (relsize>=-128) and (relsize<=127) and                             (                              not assigned(currsym) or                              (currsym.objsection=objdata.currobjsec)                             ) then                            ot:=OT_IMM8 or OT_SHORT                          else                            ot:=OT_IMM32 or OT_NEAR;                        end                      else                        ot:=OT_IMM32 or OT_NEAR;                    end;                end;              top_local :                begin                  if (ot and OT_SIZE_MASK)=0 then                    ot:=OT_MEMORY or opsize_2_type[i,opsize]                  else                    ot:=OT_MEMORY or (ot and OT_SIZE_MASK);                end;              top_const :                begin                  // if opcode is a SSE or AVX-instruction then we need a                  // special handling (opsize can different from const-size)                  // (e.g. "pextrw  reg/m16, xmmreg, imm8" =>> opsize (16 bit), const-size (8 bit)                  if (InsTabMemRefSizeInfoCache^[opcode].ExistsSSEAVX) and                     (not(InsTabMemRefSizeInfoCache^[opcode].ConstSize in [csiMultiple, csiUnkown])) then                  begin                    case InsTabMemRefSizeInfoCache^[opcode].ConstSize of                      csiNoSize: ot := ot and (not(OT_SIZE_MASK)) or OT_IMMEDIATE;                        csiMem8: ot := ot and (not(OT_SIZE_MASK)) or OT_IMMEDIATE or OT_BITS8;                       csiMem16: ot := ot and (not(OT_SIZE_MASK)) or OT_IMMEDIATE or OT_BITS16;                       csiMem32: ot := ot and (not(OT_SIZE_MASK)) or OT_IMMEDIATE or OT_BITS32;                       csiMem64: ot := ot and (not(OT_SIZE_MASK)) or OT_IMMEDIATE or OT_BITS64;                    end;                  end                  else                  begin                    { allow 2nd, 3rd or 4th operand being a constant and expect no size for shuf* etc. }                    { further, allow AAD and AAM with imm. operand }                    if (opsize=S_NO) and not((i in [1,2,3]) or ((i=0) and (opcode in [A_AAD,A_AAM]))) then                      message(asmr_e_invalid_opcode_and_operand);                    if (opsize<>S_W) and (aint(val)>=-128) and (val<=127) then                      ot:=OT_IMM8 or OT_SIGNED                    else                      ot:=OT_IMMEDIATE or opsize_2_type[i,opsize];                    if (val=1) and (i=1) then                      ot := ot or OT_ONENESS;                  end;                end;              top_none :                begin                  { generated when there was an error in the                    assembler reader. It never happends when generating                    assembler }                end;              else                internalerror(200402261);            end;          end;      end;    function taicpu.InsEnd:longint;      begin        InsEnd:=InsOffset+InsSize;      end;      function taicpu.Matches(p:PInsEntry):boolean;      { * IF_SM stands for Size Match: any operand whose size is not       * explicitly specified by the template is `really' intended to be       * the same size as the first size-specified operand.       * Non-specification is tolerated in the input instruction, but       * _wrong_ specification is not.       *       * IF_SM2 invokes Size Match on only the first _two_ operands, for       * three-operand instructions such as SHLD: it implies that the       * first two operands must match in size, but that the third is       * required to be _unspecified_.       *       * IF_SB invokes Size Byte: operands with unspecified size in the       * template are really bytes, and so no non-byte specification in       * the input instruction will be tolerated. IF_SW similarly invokes       * Size Word, and IF_SD invokes Size Doubleword.       *       * (The default state if neither IF_SM nor IF_SM2 is specified is       * that any operand with unspecified size in the template is       * required to have unspecified size in the instruction too...)      }      var        insot,        currot,        i,j,asize,oprs : longint;        insflags:cardinal;        siz : array[0..max_operands-1] of longint;      begin        result:=false;        { Check the opcode and operands }        if (p^.opcode<>opcode) or (p^.ops<>ops) then          exit;        for i:=0 to p^.ops-1 do         begin           insot:=p^.optypes[i];           currot:=oper[i]^.ot;           { Check the operand flags }           if (insot and (not currot) and OT_NON_SIZE)<>0 then             exit;           { Check if the passed operand size matches with one of             the supported operand sizes }           if ((insot and OT_SIZE_MASK)<>0) and              ((insot and currot and OT_SIZE_MASK)<>(currot and OT_SIZE_MASK)) then             exit;         end;        { Check operand sizes }        insflags:=p^.flags;        if insflags and IF_SMASK<>0 then          begin            { as default an untyped size can get all the sizes, this is different              from nasm, but else we need to do a lot checking which opcodes want              size or not with the automatic size generation }            asize:=-1;            if (insflags and IF_SB)<>0 then              asize:=OT_BITS8            else if (insflags and IF_SW)<>0 then              asize:=OT_BITS16            else if (insflags and IF_SD)<>0 then              asize:=OT_BITS32;            if (insflags and IF_ARMASK)<>0 then             begin               siz[0]:=-1;               siz[1]:=-1;               siz[2]:=-1;               siz[((insflags and IF_ARMASK) shr IF_ARSHIFT)-1]:=asize;             end            else             begin               siz[0]:=asize;               siz[1]:=asize;               siz[2]:=asize;             end;            if (insflags and (IF_SM or IF_SM2))<>0 then             begin               if (insflags and IF_SM2)<>0 then                oprs:=2               else                oprs:=p^.ops;               for i:=0 to oprs-1 do                if ((p^.optypes[i] and OT_SIZE_MASK) <> 0) then                 begin                   for j:=0 to oprs-1 do                    siz[j]:=p^.optypes[i] and OT_SIZE_MASK;                   break;                 end;              end             else              oprs:=2;            { Check operand sizes }            for i:=0 to p^.ops-1 do              begin                insot:=p^.optypes[i];                currot:=oper[i]^.ot;                if ((insot and OT_SIZE_MASK)=0) and                   ((currot and OT_SIZE_MASK and (not siz[i]))<>0) and                   { Immediates can always include smaller size }                   ((currot and OT_IMMEDIATE)=0) and                    (((insot and OT_SIZE_MASK) or siz[i])<(currot and OT_SIZE_MASK)) then                  exit;              end;          end;        if (InsTabMemRefSizeInfoCache^[opcode].MemRefSize in MemRefMultiples) and           (InsTabMemRefSizeInfoCache^[opcode].ExistsSSEAVX) then        begin          for i:=0 to p^.ops-1 do           begin             insot:=p^.optypes[i];             if ((insot and OT_XMMRM) = OT_XMMRM) OR                ((insot and OT_YMMRM) = OT_YMMRM) then             begin               if (insot and OT_SIZE_MASK) = 0 then               begin                 case insot and (OT_XMMRM or OT_YMMRM) of                   OT_XMMRM: insot := insot or OT_BITS128;                   OT_YMMRM: insot := insot or OT_BITS256;                 end;               end;             end;             currot:=oper[i]^.ot;             { Check the operand flags }             if (insot and (not currot) and OT_NON_SIZE)<>0 then               exit;             { Check if the passed operand size matches with one of               the supported operand sizes }             if ((insot and OT_SIZE_MASK)<>0) and                ((insot and currot and OT_SIZE_MASK)<>(currot and OT_SIZE_MASK)) then               exit;           end;        end;        result:=true;      end;    procedure taicpu.ResetPass1;      begin        { we need to reset everything here, because the choosen insentry          can be invalid for a new situation where the previously optimized          insentry is not correct }        InsEntry:=nil;        InsSize:=0;        LastInsOffset:=-1;      end;    procedure taicpu.ResetPass2;      begin        { we are here in a second pass, check if the instruction can be optimized }        if assigned(InsEntry) and           ((InsEntry^.flags and IF_PASS2)<>0) then         begin           InsEntry:=nil;           InsSize:=0;         end;        LastInsOffset:=-1;      end;    function taicpu.CheckIfValid:boolean;      begin        result:=FindInsEntry(nil);      end;    function taicpu.FindInsentry(objdata:TObjData):boolean;      var        i : longint;      begin        result:=false;      { Things which may only be done once, not when a second pass is done to        optimize }        if (Insentry=nil) or ((InsEntry^.flags and IF_PASS2)<>0) then         begin           current_filepos:=fileinfo;           { We need intel style operands }           SetOperandOrder(op_intel);           { create the .ot fields }           create_ot(objdata);           { set the file postion }         end        else         begin           { we've already an insentry so it's valid }           result:=true;           exit;         end;        { Lookup opcode in the table }        InsSize:=-1;        i:=instabcache^[opcode];        if i=-1 then         begin           Message1(asmw_e_opcode_not_in_table,gas_op2str[opcode]);           exit;         end;        insentry:=@instab[i];        while (insentry^.opcode=opcode) do         begin           if matches(insentry) then             begin               result:=true;               exit;             end;           inc(insentry);         end;        Message1(asmw_e_invalid_opcode_and_operands,GetString);        { No instruction found, set insentry to nil and inssize to -1 }        insentry:=nil;        inssize:=-1;      end;    function taicpu.Pass1(objdata:TObjData):longint;      begin        Pass1:=0;        { Save the old offset and set the new offset }        InsOffset:=ObjData.CurrObjSec.Size;        { Error? }        if (Insentry=nil) and (InsSize=-1) then          exit;        { set the file postion }        current_filepos:=fileinfo;        { Get InsEntry }        if FindInsEntry(ObjData) then         begin           { Calculate instruction size }           InsSize:=calcsize(insentry);           if segprefix<>NR_NO then            inc(InsSize);           { Fix opsize if size if forced }           if (insentry^.flags and (IF_SB or IF_SW or IF_SD))<>0 then             begin               if (insentry^.flags and IF_ARMASK)=0 then                 begin                   if (insentry^.flags and IF_SB)<>0 then                     begin                       if opsize=S_NO then                         opsize:=S_B;                     end                   else if (insentry^.flags and IF_SW)<>0 then                     begin                       if opsize=S_NO then                         opsize:=S_W;                     end                   else if (insentry^.flags and IF_SD)<>0 then                     begin                       if opsize=S_NO then                         opsize:=S_L;                     end;                 end;             end;           LastInsOffset:=InsOffset;           Pass1:=InsSize;           exit;         end;        LastInsOffset:=-1;      end;    const      segprefixes: array[NR_CS..NR_GS] of Byte=(      //cs   ds   es   ss   fs   gs        $2E, $3E, $26, $36, $64, $65      );    procedure taicpu.Pass2(objdata:TObjData);      begin        { error in pass1 ? }        if insentry=nil then         exit;        current_filepos:=fileinfo;        { Segment override }        if (segprefix>=NR_CS) and (segprefix<=NR_GS) then         begin           objdata.writebytes(segprefixes[segprefix],1);           { fix the offset for GenNode }           inc(InsOffset);         end        else if segprefix<>NR_NO then          InternalError(201001071);        { Generate the instruction }        GenCode(objdata);      end;    function taicpu.needaddrprefix(opidx:byte):boolean;      begin        result:=(oper[opidx]^.typ=top_ref) and                (oper[opidx]^.ref^.refaddr=addr_no) and    {$ifdef x86_64}                (oper[opidx]^.ref^.base<>NR_RIP) and    {$endif x86_64}                (                 (                  (oper[opidx]^.ref^.index<>NR_NO) and                  (getsubreg(oper[opidx]^.ref^.index)<>R_SUBADDR)                 ) or                 (                  (oper[opidx]^.ref^.base<>NR_NO) and                  (getsubreg(oper[opidx]^.ref^.base)<>R_SUBADDR)                 )                );      end;    function regval(r:Tregister):byte;      const    {$ifdef x86_64}        opcode_table:array[tregisterindex] of tregisterindex = (          {$i r8664op.inc}        );    {$else x86_64}        opcode_table:array[tregisterindex] of tregisterindex = (          {$i r386op.inc}        );    {$endif x86_64}      var        regidx : tregisterindex;      begin        regidx:=findreg_by_number(r);        if regidx<>0 then          result:=opcode_table[regidx]        else          begin            Message1(asmw_e_invalid_register,generic_regname(r));            result:=0;          end;      end;{$ifdef x86_64}    function rexbits(r: tregister): byte;      begin        result:=0;        case getregtype(r) of          R_INTREGISTER:            if (getsupreg(r)>=RS_R8) then          { Either B,X or R bits can be set, depending on register role in instruction.            Set all three bits here, caller will discard unnecessary ones. }              result:=result or $47            else if (getsubreg(r)=R_SUBL) and              (getsupreg(r) in [RS_RDI,RS_RSI,RS_RBP,RS_RSP]) then              result:=result or $40            else if (getsubreg(r)=R_SUBH) then          { Not an actual REX bit, used to detect incompatible usage of            AH/BH/CH/DH }              result:=result or $80;          R_MMREGISTER:            if getsupreg(r)>=RS_XMM8 then              result:=result or $47;        end;      end;    function process_ea(const input:toper;out output:ea;rfield:longint):boolean;      var        sym   : tasmsymbol;        md,s,rv  : byte;        base,index,scalefactor,        o     : longint;        ir,br : Tregister;        isub,bsub : tsubregister;      begin        process_ea:=false;        fillchar(output,sizeof(output),0);        {Register ?}        if (input.typ=top_reg) then          begin            rv:=regval(input.reg);            output.modrm:=$c0 or (rfield shl 3) or rv;            output.size:=1;            output.rex:=output.rex or (rexbits(input.reg) and $F1);            process_ea:=true;            exit;         end;        {No register, so memory reference.}        if input.typ<>top_ref then          internalerror(200409263);        ir:=input.ref^.index;        br:=input.ref^.base;        isub:=getsubreg(ir);        bsub:=getsubreg(br);        s:=input.ref^.scalefactor;        o:=input.ref^.offset;        sym:=input.ref^.symbol;        if ((ir<>NR_NO) and (getregtype(ir)<>R_INTREGISTER)) or           ((br<>NR_NO) and (br<>NR_RIP) and (getregtype(br)<>R_INTREGISTER)) then          internalerror(200301081);        { it's direct address }        if (br=NR_NO) and (ir=NR_NO) then         begin           output.sib_present:=true;           output.bytes:=4;           output.modrm:=4 or (rfield shl 3);           output.sib:=$25;         end        else if (br=NR_RIP) and (ir=NR_NO) then          begin            { rip based }            output.sib_present:=false;            output.bytes:=4;            output.modrm:=5 or (rfield shl 3);          end        else        { it's an indirection }         begin           { 16 bit or 32 bit address? }           if ((ir<>NR_NO) and (isub<>R_SUBADDR)) or              ((br<>NR_NO) and (bsub<>R_SUBADDR)) then             message(asmw_e_16bit_32bit_not_supported);           { wrong, for various reasons }           if (ir=NR_ESP) or ((s<>1) and (s<>2) and (s<>4) and (s<>8) and (ir<>NR_NO)) then            exit;           output.rex:=output.rex or (rexbits(br) and $F1) or (rexbits(ir) and $F2);           process_ea:=true;           { base }           case br of             NR_R8,             NR_RAX : base:=0;             NR_R9,             NR_RCX : base:=1;             NR_R10,             NR_RDX : base:=2;             NR_R11,             NR_RBX : base:=3;             NR_R12,             NR_RSP : base:=4;             NR_R13,             NR_NO,             NR_RBP : base:=5;             NR_R14,             NR_RSI : base:=6;             NR_R15,             NR_RDI : base:=7;           else             exit;           end;           { index }           case ir of             NR_R8,             NR_RAX : index:=0;             NR_R9,             NR_RCX : index:=1;             NR_R10,             NR_RDX : index:=2;             NR_R11,             NR_RBX : index:=3;             NR_R12,             NR_NO  : index:=4;             NR_R13,             NR_RBP : index:=5;             NR_R14,             NR_RSI : index:=6;             NR_R15,             NR_RDI : index:=7;           else             exit;           end;           case s of            0,            1 : scalefactor:=0;            2 : scalefactor:=1;            4 : scalefactor:=2;            8 : scalefactor:=3;           else            exit;           end;           { If rbp or r13 is used we must always include an offset }           if (br=NR_NO) or              ((br<>NR_RBP) and (br<>NR_R13) and (o=0) and (sym=nil)) then            md:=0           else            if ((o>=-128) and (o<=127) and (sym=nil)) then             md:=1            else             md:=2;           if (br=NR_NO) or (md=2) then            output.bytes:=4           else            output.bytes:=md;           { SIB needed ? }           if (ir=NR_NO) and (br<>NR_RSP) and (br<>NR_R12) then            begin              output.sib_present:=false;              output.modrm:=(md shl 6) or (rfield shl 3) or base;            end           else            begin              output.sib_present:=true;              output.modrm:=(md shl 6) or (rfield shl 3) or 4;              output.sib:=(scalefactor shl 6) or (index shl 3) or base;            end;         end;        output.size:=1+ord(output.sib_present)+output.bytes;        process_ea:=true;      end;{$else x86_64}    function process_ea(const input:toper;out output:ea;rfield:longint):boolean;      var        sym   : tasmsymbol;        md,s,rv  : byte;        base,index,scalefactor,        o     : longint;        ir,br : Tregister;        isub,bsub : tsubregister;      begin        process_ea:=false;        fillchar(output,sizeof(output),0);        {Register ?}        if (input.typ=top_reg) then          begin            rv:=regval(input.reg);            output.modrm:=$c0 or (rfield shl 3) or rv;            output.size:=1;            process_ea:=true;            exit;         end;        {No register, so memory reference.}        if (input.typ<>top_ref) then          internalerror(200409262);        if ((input.ref^.index<>NR_NO) and (getregtype(input.ref^.index)<>R_INTREGISTER)) or           ((input.ref^.base<>NR_NO) and (getregtype(input.ref^.base)<>R_INTREGISTER)) then          internalerror(200301081);        ir:=input.ref^.index;        br:=input.ref^.base;        isub:=getsubreg(ir);        bsub:=getsubreg(br);        s:=input.ref^.scalefactor;        o:=input.ref^.offset;        sym:=input.ref^.symbol;      { it's direct address }        if (br=NR_NO) and (ir=NR_NO) then         begin           { it's a pure offset }           output.sib_present:=false;           output.bytes:=4;           output.modrm:=5 or (rfield shl 3);         end        else        { it's an indirection }         begin           { 16 bit address? }           if ((ir<>NR_NO) and (isub<>R_SUBADDR)) or              ((br<>NR_NO) and (bsub<>R_SUBADDR)) then             message(asmw_e_16bit_not_supported);{$ifdef OPTEA}           { make single reg base }           if (br=NR_NO) and (s=1) then            begin              br:=ir;              ir:=NR_NO;            end;           { convert [3,5,9]*EAX to EAX+[2,4,8]*EAX }           if (br=NR_NO) and              (((s=2) and (ir<>NR_ESP)) or                (s=3) or (s=5) or (s=9)) then            begin              br:=ir;              dec(s);            end;           { swap ESP into base if scalefactor is 1 }           if (s=1) and (ir=NR_ESP) then            begin              ir:=br;              br:=NR_ESP;            end;{$endif OPTEA}           { wrong, for various reasons }           if (ir=NR_ESP) or ((s<>1) and (s<>2) and (s<>4) and (s<>8) and (ir<>NR_NO)) then            exit;           { base }           case br of             NR_EAX : base:=0;             NR_ECX : base:=1;             NR_EDX : base:=2;             NR_EBX : base:=3;             NR_ESP : base:=4;             NR_NO,             NR_EBP : base:=5;             NR_ESI : base:=6;             NR_EDI : base:=7;           else             exit;           end;           { index }           case ir of             NR_EAX : index:=0;             NR_ECX : index:=1;             NR_EDX : index:=2;             NR_EBX : index:=3;             NR_NO  : index:=4;             NR_EBP : index:=5;             NR_ESI : index:=6;             NR_EDI : index:=7;           else             exit;           end;           case s of            0,            1 : scalefactor:=0;            2 : scalefactor:=1;            4 : scalefactor:=2;            8 : scalefactor:=3;           else            exit;           end;           if (br=NR_NO) or              ((br<>NR_EBP) and (o=0) and (sym=nil)) then            md:=0           else            if ((o>=-128) and (o<=127) and (sym=nil)) then             md:=1            else             md:=2;           if (br=NR_NO) or (md=2) then            output.bytes:=4           else            output.bytes:=md;           { SIB needed ? }           if (ir=NR_NO) and (br<>NR_ESP) then            begin              output.sib_present:=false;              output.modrm:=(longint(md) shl 6) or (rfield shl 3) or base;            end           else            begin              output.sib_present:=true;              output.modrm:=(longint(md) shl 6) or (rfield shl 3) or 4;              output.sib:=(scalefactor shl 6) or (index shl 3) or base;            end;         end;        if output.sib_present then         output.size:=2+output.bytes        else         output.size:=1+output.bytes;        process_ea:=true;      end;{$endif x86_64}    function taicpu.calcsize(p:PInsEntry):shortint;      var        codes : pchar;        c     : byte;        len     : shortint;        ea_data : ea;        exists_vex: boolean;        exists_vex_extention: boolean;        exists_prefix_66: boolean;        exists_prefix_F2: boolean;        exists_prefix_F3: boolean;{$ifdef x86_64}        omit_rexw : boolean;{$endif x86_64}      begin        len:=0;        codes:=@p^.code[0];        exists_vex := false;        exists_vex_extention := false;        exists_prefix_66 := false;        exists_prefix_F2 := false;        exists_prefix_F3 := false;{$ifdef x86_64}        rex:=0;        omit_rexw:=false;{$endif x86_64}        repeat          c:=ord(codes^);          inc(codes);          case c of            0 :              break;            1,2,3 :              begin                inc(codes,c);                inc(len,c);              end;            8,9,10 :              begin{$ifdef x86_64}                rex:=rex or (rexbits(oper[c-8]^.reg) and $F1);{$endif x86_64}                inc(codes);                inc(len);              end;            11 :              begin                inc(codes);                inc(len);              end;            4,5,6,7 :              begin                if opsize=S_W then                  inc(len,2)                else                  inc(len);              end;            12,13,14,            16,17,18,            20,21,22,23,            40,41,42 :              inc(len);            24,25,26,            31,            48,49,50 :              inc(len,2);            28,29,30:              begin                if opsize=S_Q then                  inc(len,8)                else                  inc(len,4);              end;            36,37,38:              inc(len,sizeof(pint));            44,45,46:              inc(len,8);            32,33,34,            52,53,54,            56,57,58,            172,173,174 :              inc(len,4);            60,61,62,63: ; // ignore vex-coded operand-idx            208,209,210 :              begin                case (oper[c-208]^.ot and OT_SIZE_MASK) of                  OT_BITS16:                    inc(len);{$ifdef x86_64}                  OT_BITS64:                    begin                      rex:=rex or $48;                    end;{$endif x86_64}                end;              end;            200 :{$ifndef x86_64}              inc(len);{$else x86_64}              { every insentry with code 0310 must be marked with NOX86_64 }              InternalError(2011051301);{$endif x86_64}            201 :{$ifdef x86_64}              inc(len){$endif x86_64}              ;            212 :              inc(len);            214 :              begin{$ifdef x86_64}                rex:=rex or $48;{$endif x86_64}              end;            202,            211,            213,            215,            217,218: ;            219:              begin                inc(len);                exists_prefix_F2 := true;              end;            220:              begin                inc(len);                exists_prefix_F3 := true;              end;            241:              begin                inc(len);                exists_prefix_66 := true;              end;            221:{$ifdef x86_64}              omit_rexw:=true{$endif x86_64}              ;            64..151 :              begin{$ifdef x86_64}                 if (c<127) then                  begin                    if (oper[c and 7]^.typ=top_reg) then                      begin                        rex:=rex or (rexbits(oper[c and 7]^.reg) and $F4);                      end;                  end;{$endif x86_64}                if not process_ea(oper[(c shr 3) and 7]^, ea_data, 0) then                  Message(asmw_e_invalid_effective_address)                else                  inc(len,ea_data.size);{$ifdef x86_64}                rex:=rex or ea_data.rex;{$endif x86_64}              end;            242: // VEX prefix for AVX (length = 2 or 3 bytes, dependens on REX.XBW or opcode-prefix ($0F38 or $0F3A))                 // =>> DEFAULT = 2 Bytes              begin                if not(exists_vex) then                begin                  inc(len, 2);                  exists_vex := true;                end;              end;            243: // REX.W = 1                 // =>> VEX prefix length = 3              begin                if not(exists_vex_extention) then                begin                  inc(len);                  exists_vex_extention := true;                end;              end;            244: ; // VEX length bit            247: inc(len); // operand 3 (ymmreg) encoded immediate byte (bit 4-7)            248: // VEX-Extention prefix $0F                 // ignore for calculating length                 ;            249, // VEX-Extention prefix $0F38            250: // VEX-Extention prefix $0F3A              begin                if not(exists_vex_extention) then                begin                  inc(len);                  exists_vex_extention := true;                end;              end;            else             InternalError(200603141);          end;        until false;{$ifdef x86_64}        if ((rex and $80)<>0) and ((rex and $4F)<>0) then          Message(asmw_e_bad_reg_with_rex);        rex:=rex and $4F;      { reset extra bits in upper nibble }        if omit_rexw then          begin            if rex=$48 then    { remove rex entirely? }              rex:=0            else              rex:=rex and $F7;          end;        if not(exists_vex) then         begin          if rex<>0 then            Inc(len);        end;{$endif}        if exists_vex then        begin          if exists_prefix_66 then dec(len);          if exists_prefix_F2 then dec(len);          if exists_prefix_F3 then dec(len);  {$ifdef x86_64}          if not(exists_vex_extention) then            if rex and $0B <> 0 then inc(len);  // REX.WXB <> 0 =>> needed VEX-Extention  {$endif x86_64}        end;        calcsize:=len;      end;    procedure taicpu.GenCode(objdata:TObjData);      {       * the actual codes (C syntax, i.e. octal):       * \0            - terminates the code. (Unless it's a literal of course.)       * \1, \2, \3    - that many literal bytes follow in the code stream       * \4, \6        - the POP/PUSH (respectively) codes for CS, DS, ES, SS       *                 (POP is never used for CS) depending on operand 0       * \5, \7        - the second byte of POP/PUSH codes for FS, GS, depending       *                 on operand 0       * \10, \11, \12 - a literal byte follows in the code stream, to be added       *                 to the register value of operand 0, 1 or 2       * \13           - a literal byte follows in the code stream, to be added       *                 to the condition code value of the instruction.       * \14, \15, \16 - a signed byte immediate operand, from operand 0, 1 or 2       * \20, \21, \22 - a byte immediate operand, from operand 0, 1 or 2       * \24, \25, \26, \27 - an unsigned byte immediate operand, from operand 0, 1, 2 or 3       * \30, \31, \32 - a word immediate operand, from operand 0, 1 or 2       * \34, \35, \36 - select between \3[012] and \4[012] depending on 16/32 bit       *                 assembly mode or the address-size override on the operand       * \37           - a word constant, from the _segment_ part of operand 0       * \40, \41, \42 - a long immediate operand, from operand 0, 1 or 2       * \44, \45, \46 - select between \3[012], \4[012] or \5[456] depending                         on the address size of instruction       * \50, \51, \52 - a byte relative operand, from operand 0, 1 or 2       * \54, \55, \56 - a qword immediate, from operand 0, 1 or 2       * \60, \61, \62 - a word relative operand, from operand 0, 1 or 2       * \64, \65, \66 - select between \6[012] and \7[012] depending on 16/32 bit       *                 assembly mode or the address-size override on the operand       * \70, \71, \72 - a long relative operand, from operand 0, 1 or 2       * \74, \75, \76 - a vex-coded vector operand, from operand 0, 1 or 2       * \1ab          - a ModRM, calculated on EA in operand a, with the spare       *                 field the register value of operand b.       * \2ab          - a ModRM, calculated on EA in operand a, with the spare       *                 field equal to digit b.       * \254,\255,\256 - a signed 32-bit immediate to be extended to 64 bits       * \300,\301,\302 - might be an 0x67, depending on the address size of       *                 the memory reference in operand x.       * \310          - indicates fixed 16-bit address size, i.e. optional 0x67.       * \311          - indicates fixed 32-bit address size, i.e. optional 0x67.       * \312          - (disassembler only) invalid with non-default address size.       * \320,\321,\322 - might be an 0x66 or 0x48 byte, depending on the operand       *                 size of operand x.       * \324          - indicates fixed 16-bit operand size, i.e. optional 0x66.       * \325          - indicates fixed 32-bit operand size, i.e. optional 0x66.       * \326          - indicates fixed 64-bit operand size, i.e. optional 0x48.       * \327          - indicates that this instruction is only valid when the       *                 operand size is the default (instruction to disassembler,       *                 generates no code in the assembler)       * \331          - instruction not valid with REP prefix.  Hint for       *                 disassembler only; for SSE instructions.       * \332	       - disassemble a rep (0xF3 byte) prefix as repe not rep.       * \333          - 0xF3 prefix for SSE instructions       * \334          - 0xF2 prefix for SSE instructions       * \335          - Indicates 64-bit operand size with REX.W not necessary       * \361          - 0x66 prefix for SSE instructions       * \362          - VEX prefix for AVX instructions       * \363          - VEX W1       * \364          - VEX Vector length 256       * \367          - operand 3 (ymmreg) encoded in bit 4-7 of the immediate byte       * \370          - VEX 0F-FLAG       * \371          - VEX 0F38-FLAG       * \372          - VEX 0F3A-FLAG      }      var        currval : aint;        currsym : tobjsymbol;        currrelreloc,        currabsreloc,        currabsreloc32 : TObjRelocationType;{$ifdef x86_64}        rexwritten : boolean;{$endif x86_64}        procedure getvalsym(opidx:longint);          begin            case oper[opidx]^.typ of              top_ref :                begin                  currval:=oper[opidx]^.ref^.offset;                  currsym:=ObjData.symbolref(oper[opidx]^.ref^.symbol);{$ifdef i386}                  if (oper[opidx]^.ref^.refaddr=addr_pic) and                     (tf_pic_uses_got in target_info.flags) then                    begin                      currrelreloc:=RELOC_PLT32;                      currabsreloc:=RELOC_GOT32;                      currabsreloc32:=RELOC_GOT32;                    end                  else{$endif i386}{$ifdef x86_64}                  if oper[opidx]^.ref^.refaddr=addr_pic then                    begin                      currrelreloc:=RELOC_PLT32;                      currabsreloc:=RELOC_GOTPCREL;                      currabsreloc32:=RELOC_GOTPCREL;                    end                  else if oper[opidx]^.ref^.refaddr=addr_pic_no_got then                    begin                      currrelreloc:=RELOC_RELATIVE;                      currabsreloc:=RELOC_RELATIVE;                      currabsreloc32:=RELOC_RELATIVE;                    end                  else{$endif x86_64}                    begin                      currrelreloc:=RELOC_RELATIVE;                      currabsreloc:=RELOC_ABSOLUTE;                      currabsreloc32:=RELOC_ABSOLUTE32;                    end;                end;              top_const :                begin                  currval:=aint(oper[opidx]^.val);                  currsym:=nil;                  currabsreloc:=RELOC_ABSOLUTE;                  currabsreloc32:=RELOC_ABSOLUTE32;                end;              else                Message(asmw_e_immediate_or_reference_expected);            end;          end;{$ifdef x86_64}       procedure maybewriterex;       begin          if (rex<>0) and not(rexwritten) then            begin              rexwritten:=true;              objdata.writebytes(rex,1);            end;        end;{$endif x86_64}       procedure objdata_writereloc(Data:aint;len:aword;p:TObjSymbol;Reloctype:TObjRelocationType);         begin{$ifdef i386}               { Special case of '_GLOBAL_OFFSET_TABLE_'                 which needs a special relocation type R_386_GOTPC }               if assigned (p) and                  (p.name='_GLOBAL_OFFSET_TABLE_') and                  (tf_pic_uses_got in target_info.flags) then                 begin                   { nothing else than a 4 byte relocation should occur                     for GOT }                   if len<>4 then                     Message1(asmw_e_invalid_opcode_and_operands,GetString);                   Reloctype:=RELOC_GOTPC;                   { We need to add the offset of the relocation                     of _GLOBAL_OFFSET_TABLE symbol within                     the current instruction }                   inc(data,objdata.currobjsec.size-insoffset);                 end;{$endif i386}           objdata.writereloc(data,len,p,Reloctype);         end;      const        CondVal:array[TAsmCond] of byte=($0,         $7, $3, $2, $6, $2, $4, $F, $D, $C, $E, $6, $2,         $3, $7, $3, $5, $E, $C, $D, $F, $1, $B, $9, $5,         $0, $A, $A, $B, $8, $4);      var        c : byte;        pb : pbyte;        codes : pchar;        bytes : array[0..3] of byte;        rfield,        data,s,opidx : longint;        ea_data : ea;        relsym : TObjSymbol;        needed_VEX_Extention: boolean;        needed_VEX: boolean;        opmode: integer;        VEXvvvv: byte;        VEXmmmmm: byte;      begin        { safety check }        if objdata.currobjsec.size<>longword(insoffset) then           internalerror(200130121);        { load data to write }        codes:=insentry^.code;{$ifdef x86_64}        rexwritten:=false;{$endif x86_64}        { Force word push/pop for registers }        if (opsize=S_W) and ((codes[0]=#4) or (codes[0]=#6) or            ((codes[0]=#1) and ((codes[2]=#5) or (codes[2]=#7)))) then        begin          bytes[0]:=$66;          objdata.writebytes(bytes,1);        end;        // needed VEX Prefix (for AVX etc.)        needed_VEX := false;        needed_VEX_Extention := false;        opmode   := -1;        VEXvvvv  := 0;        VEXmmmmm := 0;        repeat          c:=ord(codes^);          inc(codes);          case c of              0: break;              1,              2,              3: inc(codes,c);             60: opmode := 0;             61: opmode := 1;             62: opmode := 2;            219: VEXvvvv                := VEXvvvv  OR $02; // set SIMD-prefix $F3            220: VEXvvvv                := VEXvvvv  OR $03; // set SIMD-prefix $F2            241: VEXvvvv                := VEXvvvv  OR $01; // set SIMD-prefix $66            242: needed_VEX             := true;            243: begin                   needed_VEX_Extention := true;                   VEXvvvv              := VEXvvvv  OR (1 shl 7); // set REX.W                 end;            244: VEXvvvv                := VEXvvvv  OR $04; // vectorlength = 256 bits AND no scalar            248: VEXmmmmm               := VEXmmmmm OR $01; // set leading opcode byte $0F            249: begin                   needed_VEX_Extention := true;                   VEXmmmmm             := VEXmmmmm OR $02; // set leading opcode byte $0F38                 end;            250: begin                   needed_VEX_Extention := true;                   VEXmmmmm             := VEXmmmmm OR $03; // set leading opcode byte $0F3A                 end;          end;        until false;        if needed_VEX then        begin          if (opmode > ops) or             (opmode < -1) then          begin            Internalerror(777100);          end          else if opmode = -1 then          begin            VEXvvvv := VEXvvvv or ($0F shl 3); // set VEXvvvv bits (bits 6-3) to 1          end          else if oper[opmode]^.typ = top_reg then          begin            VEXvvvv := VEXvvvv or ((not(regval(oper[opmode]^.reg)) and $07) shl 3);            {$ifdef x86_64}              if rexbits(oper[opmode]^.reg) = 0 then VEXvvvv := VEXvvvv or (1 shl 6);            {$else}              VEXvvvv := VEXvvvv or (1 shl 6);            {$endif x86_64}          end          else Internalerror(777101);          if not(needed_VEX_Extention) then          begin            {$ifdef x86_64}              if rex and $0B <> 0 then needed_VEX_Extention := true;            {$endif x86_64}          end;          if needed_VEX_Extention then          begin            // VEX-Prefix-Length = 3 Bytes            bytes[0]:=$C4;            objdata.writebytes(bytes,1);            {$ifdef x86_64}              VEXmmmmm := VEXmmmmm or ((not(rex) and $07) shl 5);  // set REX.rxb            {$else}              VEXmmmmm := VEXmmmmm or (7 shl 5);  //            {$endif x86_64}              bytes[0] := VEXmmmmm;              objdata.writebytes(bytes,1);            {$ifdef x86_64}              VEXvvvv  := VEXvvvv OR ((rex and $08) shl 7);   // set REX.w            {$endif x86_64}            bytes[0] := VEXvvvv;            objdata.writebytes(bytes,1);          end          else          begin            // VEX-Prefix-Length = 2 Bytes            bytes[0]:=$C5;            objdata.writebytes(bytes,1);            {$ifdef x86_64}              if rex and $04 = 0 then            {$endif x86_64}            begin              VEXvvvv := VEXvvvv or (1 shl 7);            end;            bytes[0] := VEXvvvv;            objdata.writebytes(bytes,1);          end;        end        else        begin          needed_VEX_Extention := false;          opmode := -1;        end;        { load data to write }        codes:=insentry^.code;        repeat          c:=ord(codes^);          inc(codes);          case c of            0 :              break;            1,2,3 :              begin{$ifdef x86_64}                if not(needed_VEX) then  // TG                  maybewriterex;{$endif x86_64}                objdata.writebytes(codes^,c);                inc(codes,c);              end;            4,6 :              begin                case oper[0]^.reg of                  NR_CS:                    bytes[0]:=$e;                  NR_NO,                  NR_DS:                    bytes[0]:=$1e;                  NR_ES:                    bytes[0]:=$6;                  NR_SS:                    bytes[0]:=$16;                  else                    internalerror(777004);                end;                if c=4 then                  inc(bytes[0]);                objdata.writebytes(bytes,1);              end;            5,7 :              begin                case oper[0]^.reg of                  NR_FS:                    bytes[0]:=$a0;                  NR_GS:                    bytes[0]:=$a8;                  else                    internalerror(777005);                end;                if c=5 then                  inc(bytes[0]);                objdata.writebytes(bytes,1);              end;            8,9,10 :              begin{$ifdef x86_64}                if not(needed_VEX) then  // TG                  maybewriterex;{$endif x86_64}                bytes[0]:=ord(codes^)+regval(oper[c-8]^.reg);                inc(codes);                objdata.writebytes(bytes,1);              end;            11 :              begin                bytes[0]:=ord(codes^)+condval[condition];                inc(codes);                objdata.writebytes(bytes,1);              end;            12,13,14 :              begin                getvalsym(c-12);                if (currval<-128) or (currval>127) then                 Message2(asmw_e_value_exceeds_bounds,'signed byte',tostr(currval));                if assigned(currsym) then                  objdata_writereloc(currval,1,currsym,currabsreloc)                else                  objdata.writebytes(currval,1);              end;            16,17,18 :              begin                getvalsym(c-16);                if (currval<-256) or (currval>255) then                 Message2(asmw_e_value_exceeds_bounds,'byte',tostr(currval));                if assigned(currsym) then                 objdata_writereloc(currval,1,currsym,currabsreloc)                else                 objdata.writebytes(currval,1);              end;            20,21,22,23 :              begin                getvalsym(c-20);                if (currval<0) or (currval>255) then                 Message2(asmw_e_value_exceeds_bounds,'unsigned byte',tostr(currval));                if assigned(currsym) then                 objdata_writereloc(currval,1,currsym,currabsreloc)                else                 objdata.writebytes(currval,1);              end;            24,25,26 :     // 030..032              begin                getvalsym(c-24);                if (currval<-65536) or (currval>65535) then                 Message2(asmw_e_value_exceeds_bounds,'word',tostr(currval));                if assigned(currsym) then                 objdata_writereloc(currval,2,currsym,currabsreloc)                else                 objdata.writebytes(currval,2);              end;            28,29,30 :     // 034..036              { !!! These are intended (and used in opcode table) to select depending                    on address size, *not* operand size. Works by coincidence only. }              begin                getvalsym(c-28);                if opsize=S_Q then                  begin                    if assigned(currsym) then                     objdata_writereloc(currval,8,currsym,currabsreloc)                    else                     objdata.writebytes(currval,8);                  end                else                  begin                    if assigned(currsym) then                      objdata_writereloc(currval,4,currsym,currabsreloc32)                    else                      objdata.writebytes(currval,4);                  end              end;            32,33,34 :    // 040..042              begin                getvalsym(c-32);                if assigned(currsym) then                 objdata_writereloc(currval,4,currsym,currabsreloc32)                else                 objdata.writebytes(currval,4);              end;            36,37,38 :   // 044..046 - select between word/dword/qword depending on              begin      // address size (we support only default address sizes).                getvalsym(c-36);{$ifdef x86_64}                if assigned(currsym) then                  objdata_writereloc(currval,8,currsym,currabsreloc)                else                  objdata.writebytes(currval,8);{$else x86_64}                if assigned(currsym) then                  objdata_writereloc(currval,4,currsym,currabsreloc32)                else                  objdata.writebytes(currval,4);{$endif x86_64}              end;            40,41,42 :   // 050..052 - byte relative operand              begin                getvalsym(c-40);                data:=currval-insend;{$push}{$r-}                if assigned(currsym) then                 inc(data,currsym.address);{$pop}                if (data>127) or (data<-128) then                 Message1(asmw_e_short_jmp_out_of_range,tostr(data));                objdata.writebytes(data,1);              end;            44,45,46:   // 054..056 - qword immediate operand              begin                getvalsym(c-44);                if assigned(currsym) then                  objdata_writereloc(currval,8,currsym,currabsreloc)                else                  objdata.writebytes(currval,8);              end;            52,53,54 :  // 064..066 - select between 16/32 address mode, but we support only 32              begin                getvalsym(c-52);                if assigned(currsym) then                 objdata_writereloc(currval,4,currsym,currrelreloc)                else                 objdata_writereloc(currval-insend,4,nil,currabsreloc32)              end;            56,57,58 :  // 070..072 - long relative operand              begin                getvalsym(c-56);                if assigned(currsym) then                 objdata_writereloc(currval,4,currsym,currrelreloc)                else                 objdata_writereloc(currval-insend,4,nil,currabsreloc32)              end;            60,61,62 : ; // 074..076 - vex-coded vector operand                         // ignore            172,173,174 :  // 0254..0256 - dword implicitly sign-extended to 64-bit (x86_64 only)              begin                getvalsym(c-172);{$ifdef x86_64}                { for i386 as aint type is longint the                  following test is useless }                if (currval<low(longint)) or (currval>high(longint)) then                  Message2(asmw_e_value_exceeds_bounds,'signed dword',tostr(currval));{$endif x86_64}                if assigned(currsym) then                  objdata_writereloc(currval,4,currsym,currabsreloc32)                else                  objdata.writebytes(currval,4);              end;            200 :   { fixed 16-bit addr }{$ifndef x86_64}              begin                bytes[0]:=$67;                objdata.writebytes(bytes,1);              end;{$else x86_64}              { every insentry having code 0310 must be marked with NOX86_64 }              InternalError(2011051302);{$endif}            201 :   { fixed 32-bit addr }{$ifdef x86_64}              begin                bytes[0]:=$67;                objdata.writebytes(bytes,1);              end{$endif x86_64}               ;            208,209,210 :              begin                case oper[c-208]^.ot and OT_SIZE_MASK of                  OT_BITS16 :                    begin                      bytes[0]:=$66;                      objdata.writebytes(bytes,1);                    end;{$ifndef x86_64}                  OT_BITS64 :                      Message(asmw_e_64bit_not_supported);{$endif x86_64}                end;              end;            211,            213 : {no action needed};            212,            241:              begin                if not(needed_VEX) then                begin                  bytes[0]:=$66;                  objdata.writebytes(bytes,1);                end;              end;            214 :              begin{$ifndef x86_64}                Message(asmw_e_64bit_not_supported);{$endif x86_64}              end;            219 :              begin                if not(needed_VEX) then                begin                  bytes[0]:=$f3;                  objdata.writebytes(bytes,1);                end;              end;            220 :              begin                if not(needed_VEX) then                begin                  bytes[0]:=$f2;                  objdata.writebytes(bytes,1);                end;              end;            221:              ;            202,            215,            217,218 :              begin                { these are dissambler hints or 32 bit prefixes which                  are not needed }              end;            242..244: ; // VEX flags =>> nothing todo                 247: begin                        if needed_VEX then                        begin                          if ops = 4 then                          begin                            if (oper[3]^.typ=top_reg) then                            begin                              if (oper[3]^.ot and otf_reg_xmm <> 0) or                                 (oper[3]^.ot and otf_reg_ymm <> 0) then                              begin                                bytes[0] := ((getsupreg(oper[3]^.reg) and 15) shl 4);                                objdata.writebytes(bytes,1);                              end                              else Internalerror(777102);                            end                            else Internalerror(777103);                          end                          else Internalerror(777104);                        end                        else Internalerror(777105);                      end;            248..250: ; // VEX flags =>> nothing todo            31,            48,49,50 :              begin                InternalError(777006);              end            else              begin                { rex should be written at this point }{$ifdef x86_64}                if not(needed_VEX) then  // TG                  if (rex<>0) and not(rexwritten) then                    internalerror(200603191);{$endif x86_64}                if (c>=64) and (c<=151) then  // 0100..0227                 begin                   if (c<127) then            // 0177                    begin                      if (oper[c and 7]^.typ=top_reg) then                        rfield:=regval(oper[c and 7]^.reg)                      else                        rfield:=regval(oper[c and 7]^.ref^.base);                    end                   else                    rfield:=c and 7;                   opidx:=(c shr 3) and 7;                   if not process_ea(oper[opidx]^,ea_data,rfield) then                     Message(asmw_e_invalid_effective_address);                   pb:=@bytes[0];                   pb^:=ea_data.modrm;                   inc(pb);                   if ea_data.sib_present then                    begin                      pb^:=ea_data.sib;                      inc(pb);                    end;                   s:=pb-@bytes[0];                   objdata.writebytes(bytes,s);                   case ea_data.bytes of                     0 : ;                     1 :                       begin                         if (oper[opidx]^.ot and OT_MEMORY)=OT_MEMORY then                           begin                             currsym:=objdata.symbolref(oper[opidx]^.ref^.symbol);{$ifdef i386}                             if (oper[opidx]^.ref^.refaddr=addr_pic) and                                (tf_pic_uses_got in target_info.flags) then                               currabsreloc:=RELOC_GOT32                             else{$endif i386}{$ifdef x86_64}                             if oper[opidx]^.ref^.refaddr=addr_pic then                               currabsreloc:=RELOC_GOTPCREL                             else{$endif x86_64}                               currabsreloc:=RELOC_ABSOLUTE;                             objdata_writereloc(oper[opidx]^.ref^.offset,1,currsym,currabsreloc);                           end                         else                          begin                            bytes[0]:=oper[opidx]^.ref^.offset;                            objdata.writebytes(bytes,1);                          end;                         inc(s);                       end;                     2,4 :                       begin                         currsym:=objdata.symbolref(oper[opidx]^.ref^.symbol);                         currval:=oper[opidx]^.ref^.offset;{$ifdef x86_64}                         if oper[opidx]^.ref^.refaddr=addr_pic then                           currabsreloc:=RELOC_GOTPCREL                         else                           if oper[opidx]^.ref^.base=NR_RIP then                             begin                               currabsreloc:=RELOC_RELATIVE;                               { Adjust reloc value by number of bytes following the displacement,                                 but not if displacement is specified by literal constant }                               if Assigned(currsym) then                                 Dec(currval,InsEnd-objdata.CurrObjSec.Size-ea_data.bytes);                             end                           else{$endif x86_64}{$ifdef i386}                         if (oper[opidx]^.ref^.refaddr=addr_pic) and                            (tf_pic_uses_got in target_info.flags) then                           currabsreloc:=RELOC_GOT32                         else{$endif i386}                             currabsreloc:=RELOC_ABSOLUTE32;                           if (currabsreloc=RELOC_ABSOLUTE32) and                            (Assigned(oper[opidx]^.ref^.relsymbol)) then                           begin                             relsym:=objdata.symbolref(oper[opidx]^.ref^.relsymbol);                             if relsym.objsection=objdata.CurrObjSec then                               begin                                 currval:=objdata.CurrObjSec.size+ea_data.bytes-relsym.offset+currval;                                 currabsreloc:=RELOC_RELATIVE;                               end                             else                               begin                                 currabsreloc:=RELOC_PIC_PAIR;                                 currval:=relsym.offset;                               end;                           end;                         objdata_writereloc(currval,ea_data.bytes,currsym,currabsreloc);                         inc(s,ea_data.bytes);                       end;                   end;                 end                else                 InternalError(777007);              end;          end;        until false;      end;    function taicpu.is_same_reg_move(regtype: Tregistertype):boolean;      begin        result:=(((opcode=A_MOV) or (opcode=A_XCHG)) and                 (regtype = R_INTREGISTER) and                 (ops=2) and                 (oper[0]^.typ=top_reg) and                 (oper[1]^.typ=top_reg) and                 (oper[0]^.reg=oper[1]^.reg)                ) or                (((opcode=A_MOVSS) or (opcode=A_MOVSD) or (opcode=A_MOVQ) or                  (opcode=A_MOVAPS) or (OPCODE=A_MOVAPD)) and                 (regtype = R_MMREGISTER) and                 (ops=2) and                 (oper[0]^.typ=top_reg) and                 (oper[1]^.typ=top_reg) and                 (oper[0]^.reg=oper[1]^.reg)                );      end;    procedure build_spilling_operation_type_table;      var        opcode : tasmop;        i      : integer;      begin        new(operation_type_table);        fillchar(operation_type_table^,sizeof(toperation_type_table),byte(operand_read));        for opcode:=low(tasmop) to high(tasmop) do          begin            for i:=1 to MaxInsChanges do              begin                case InsProp[opcode].Ch[i] of                  Ch_Rop1 :                    operation_type_table^[opcode,0]:=operand_read;                  Ch_Wop1 :                    operation_type_table^[opcode,0]:=operand_write;                  Ch_RWop1,                  Ch_Mop1 :                    operation_type_table^[opcode,0]:=operand_readwrite;                  Ch_Rop2 :                    operation_type_table^[opcode,1]:=operand_read;                  Ch_Wop2 :                    operation_type_table^[opcode,1]:=operand_write;                  Ch_RWop2,                  Ch_Mop2 :                    operation_type_table^[opcode,1]:=operand_readwrite;                  Ch_Rop3 :                    operation_type_table^[opcode,2]:=operand_read;                  Ch_Wop3 :                    operation_type_table^[opcode,2]:=operand_write;                  Ch_RWop3,                  Ch_Mop3 :                    operation_type_table^[opcode,2]:=operand_readwrite;                end;              end;          end;        { Special cases that can't be decoded from the InsChanges flags }        operation_type_table^[A_IMUL,1]:=operand_readwrite;      end;    function taicpu.spilling_get_operation_type(opnr: longint): topertype;      begin        { the information in the instruction table is made for the string copy          operation MOVSD so hack here (FK)        }        if (opcode=A_MOVSD) and (ops=2) then          begin            case opnr of              0:                result:=operand_read;              1:                result:=operand_write;              else                internalerror(200506055);            end          end        else          result:=operation_type_table^[opcode,opnr];      end;    function spilling_create_load(const ref:treference;r:tregister):Taicpu;      begin        case getregtype(r) of          R_INTREGISTER :            { we don't need special code here for 32 bit loads on x86_64, since              those will automatically zero-extend the upper 32 bits. }            result:=taicpu.op_ref_reg(A_MOV,reg2opsize(r),ref,r);          R_MMREGISTER :            case getsubreg(r) of              R_SUBMMD:                result:=taicpu.op_ref_reg(A_MOVSD,reg2opsize(r),ref,r);              R_SUBMMS:                result:=taicpu.op_ref_reg(A_MOVSS,reg2opsize(r),ref,r);              R_SUBMMWHOLE:                result:=taicpu.op_ref_reg(A_MOVQ,S_NO,ref,r);              else                internalerror(200506043);            end;          else            internalerror(200401041);        end;      end;    function spilling_create_store(r:tregister; const ref:treference):Taicpu;      var        size: topsize;      begin        case getregtype(r) of          R_INTREGISTER :            begin              size:=reg2opsize(r);{$ifdef x86_64}              { even if it's a 32 bit reg, we still have to spill 64 bits                because we often perform 64 bit operations on them }              if (size=S_L) then                begin                  size:=S_Q;                  r:=newreg(getregtype(r),getsupreg(r),R_SUBWHOLE);                end;{$endif x86_64}              result:=taicpu.op_reg_ref(A_MOV,size,r,ref);            end;          R_MMREGISTER :            case getsubreg(r) of              R_SUBMMD:                result:=taicpu.op_reg_ref(A_MOVSD,reg2opsize(r),r,ref);              R_SUBMMS:                result:=taicpu.op_reg_ref(A_MOVSS,reg2opsize(r),r,ref);              R_SUBMMWHOLE:                result:=taicpu.op_reg_ref(A_MOVQ,S_NO,r,ref);              else                internalerror(200506042);            end;          else            internalerror(200401041);        end;      end;{*****************************************************************************                              Instruction table*****************************************************************************}    procedure BuildInsTabCache;      var        i : longint;      begin        new(instabcache);        FillChar(instabcache^,sizeof(tinstabcache),$ff);        i:=0;        while (i<InsTabEntries) do         begin           if InsTabCache^[InsTab[i].OPcode]=-1 then            InsTabCache^[InsTab[i].OPcode]:=i;           inc(i);         end;      end;    procedure BuildInsTabMemRefSizeInfoCache;    var      AsmOp: TasmOp;      i,j: longint;      insentry  : PInsEntry;      MRefInfo: TMemRefSizeInfo;      SConstInfo: TConstSizeInfo;      actRegSize: int64;      actMemSize: int64;      actConstSize: int64;      actRegCount: integer;      actMemCount: integer;      actConstCount: integer;      actRegTypes  : int64;      actRegMemTypes: int64;      NewRegSize: int64;      NewMemSize: int64;      NewConstSize: int64;      RegSize: int64;      MemSize: int64;      ConstSize: int64;      RegMMXSizeMask: int64;      RegXMMSizeMask: int64;      RegYMMSizeMask: int64;      bitcount: integer;      IsRegSizeMemSize: boolean;      ExistsRegMem: boolean;      s: string;      function bitcnt(aValue: int64): integer;      var        i: integer;      begin        result := 0;        for i := 0 to 63 do        begin          if (aValue mod 2) = 1 then          begin            inc(result);          end;          aValue := aValue shr 1;        end;      end;    begin      new(InsTabMemRefSizeInfoCache);      FillChar(InsTabMemRefSizeInfoCache^,sizeof(TInsTabMemRefSizeInfoCache),0);      for AsmOp := low(TAsmOp) to high(TAsmOp) do      begin        i := InsTabCache^[AsmOp];        if i >= 0 then        begin          InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize   := msiUnkown;          InsTabMemRefSizeInfoCache^[AsmOp].ConstSize    := csiUnkown;          InsTabMemRefSizeInfoCache^[AsmOp].ExistsSSEAVX := false;          RegSize := 0;          IsRegSizeMemSize := true;          ExistsRegMem     := false;          insentry:=@instab[i];          RegMMXSizeMask := 0;          RegXMMSizeMask := 0;          RegYMMSizeMask := 0;          while (insentry^.opcode=AsmOp) do          begin            MRefInfo         := msiUnkown;            actRegSize       := 0;            actRegCount      := 0;            actRegTypes      := 0;            NewRegSize       := 0;            actMemSize       := 0;            actMemCount      := 0;            actRegMemTypes   := 0;            NewMemSize       := 0;            actConstSize     := 0;            actConstCount    := 0;            NewConstSize     := 0;            if asmop = a_movups then            begin              RegXMMSizeMask := RegXMMSizeMask;            end;            for j := 0 to insentry^.ops -1 do            begin              if (insentry^.optypes[j] and OT_REGISTER) = OT_REGISTER then              begin                inc(actRegCount);                NewRegSize := (insentry^.optypes[j] and OT_SIZE_MASK);                if NewRegSize = 0 then                begin                  case insentry^.optypes[j] and (OT_MMXREG OR OT_XMMREG OR OT_YMMREG) of                    OT_MMXREG: begin                                 NewRegSize := OT_BITS64;                               end;                    OT_XMMREG: begin                                 NewRegSize := OT_BITS128;                                 InsTabMemRefSizeInfoCache^[AsmOp].ExistsSSEAVX := true;                               end;                    OT_YMMREG: begin                                 NewRegSize := OT_BITS256;                                 InsTabMemRefSizeInfoCache^[AsmOp].ExistsSSEAVX := true;                               end;                          else NewRegSize := not(0);                  end;                end;                actRegSize  := actRegSize or NewRegSize;                actRegTypes := actRegTypes or (insentry^.optypes[j] and (OT_MMXREG OR OT_XMMREG OR OT_YMMREG));              end              else if ((insentry^.optypes[j] and OT_MEMORY) <> 0) then              begin                inc(actMemCount);                actMemSize    := actMemSize or (insentry^.optypes[j] and OT_SIZE_MASK);                if (insentry^.optypes[j] and OT_REGMEM) = OT_REGMEM then                begin                  actRegMemTypes  := actRegMemTypes or insentry^.optypes[j];                end;              end              else if ((insentry^.optypes[j] and OT_IMMEDIATE) = OT_IMMEDIATE) then              begin                inc(actConstCount);                actConstSize    := actConstSize or (insentry^.optypes[j] and OT_SIZE_MASK);              end            end;            if actConstCount > 0 then            begin              case actConstSize of                        0: SConstInfo := csiNoSize;                 OT_BITS8: SConstInfo := csiMem8;                OT_BITS16: SConstInfo := csiMem16;                OT_BITS32: SConstInfo := csiMem32;                OT_BITS64: SConstInfo := csiMem64;                      else SConstInfo := csiMultiple;              end;              if InsTabMemRefSizeInfoCache^[AsmOp].ConstSize = csiUnkown then              begin                InsTabMemRefSizeInfoCache^[AsmOp].ConstSize := SConstInfo;              end              else if InsTabMemRefSizeInfoCache^[AsmOp].ConstSize <> SConstInfo then              begin                InsTabMemRefSizeInfoCache^[AsmOp].ConstSize := csiMultiple;              end;            end;            case actMemCount of                0: ; // nothing todo                1: begin                     MRefInfo := msiUnkown;                     case actRegMemTypes and (OT_MMXRM OR OT_XMMRM OR OT_YMMRM) of                       OT_MMXRM: actMemSize := actMemSize or OT_BITS64;                       OT_XMMRM: actMemSize := actMemSize or OT_BITS128;                       OT_YMMRM: actMemSize := actMemSize or OT_BITS256;                     end;                     case actMemSize of                                0: MRefInfo := msiNoSize;                         OT_BITS8: MRefInfo := msiMem8;                        OT_BITS16: MRefInfo := msiMem16;                        OT_BITS32: MRefInfo := msiMem32;                        OT_BITS64: MRefInfo := msiMem64;                       OT_BITS128: MRefInfo := msiMem128;                       OT_BITS256: MRefInfo := msiMem256;                       OT_BITS80,                          OT_FAR,                         OT_NEAR,                         OT_SHORT: ; // ignore                              else begin                                     bitcount := bitcnt(actMemSize);                                     if bitcount > 1 then MRefInfo := msiMultiple                                     else InternalError(777203);                                   end;                     end;                     if InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize = msiUnkown then                     begin                       InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := MRefInfo;                     end                     else if InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize <> MRefInfo then                     begin                       with InsTabMemRefSizeInfoCache^[AsmOp] do                       begin                         if ((MemRefSize = msiMem8)        OR (MRefInfo = msiMem8))   then MemRefSize := msiMultiple8                         else if ((MemRefSize = msiMem16)  OR (MRefInfo = msiMem16))  then MemRefSize := msiMultiple16                         else if ((MemRefSize = msiMem32)  OR (MRefInfo = msiMem32))  then MemRefSize := msiMultiple32                         else if ((MemRefSize = msiMem64)  OR (MRefInfo = msiMem64))  then MemRefSize := msiMultiple64                         else if ((MemRefSize = msiMem128) OR (MRefInfo = msiMem128)) then MemRefSize := msiMultiple128                         else if ((MemRefSize = msiMem256) OR (MRefInfo = msiMem256)) then MemRefSize := msiMultiple256                         else MemRefSize := msiMultiple;                       end;                     end;                     if actRegCount > 0 then                     begin                       case actRegTypes and (OT_MMXREG or OT_XMMREG or OT_YMMREG) of                         OT_MMXREG: RegMMXSizeMask := RegMMXSizeMask or actMemSize;                         OT_XMMREG: RegXMMSizeMask := RegXMMSizeMask or actMemSize;                         OT_YMMREG: RegYMMSizeMask := RegYMMSizeMask or actMemSize;                               else begin                                      RegMMXSizeMask := not(0);                                      RegXMMSizeMask := not(0);                                      RegYMMSizeMask := not(0);                                    end;                       end;                     end;                   end;              else InternalError(777202);            end;            inc(insentry);          end;          if (InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize in MemRefMultiples) and             (InsTabMemRefSizeInfoCache^[AsmOp].ExistsSSEAVX)then          begin            case RegXMMSizeMask of               OT_BITS64: case RegYMMSizeMask of                            OT_BITS128: InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiMemRegx64y128;                            OT_BITS256: InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiMemRegx64y256;                          end;              OT_BITS128: begin                            if RegMMXSizeMask = 0 then                            begin                              case RegYMMSizeMask of                                OT_BITS128: InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiMemRegx64y128;                                OT_BITS256: InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiMemRegSize;                              end;                            end                            else if RegYMMSizeMask = 0 then                            begin                              case RegMMXSizeMask of                                OT_BITS64: InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize := msiMemRegSize;                              end;                            end                            else InternalError(777205);                          end;            end;          end;        end;      end;      for AsmOp := low(TAsmOp) to high(TAsmOp) do      begin        // only supported intructiones with SSE- or AVX-operands        if not(InsTabMemRefSizeInfoCache^[AsmOp].ExistsSSEAVX) then        begin          InsTabMemRefSizeInfoCache^[AsmOp].MemRefSize  := msiUnkown;          InsTabMemRefSizeInfoCache^[AsmOp].ConstSize   := csiUnkown;        end;      end;    end;    procedure InitAsm;      begin        build_spilling_operation_type_table;        if not assigned(instabcache) then          BuildInsTabCache;        if not assigned(InsTabMemRefSizeInfoCache) then          BuildInsTabMemRefSizeInfoCache;      end;    procedure DoneAsm;      begin        if assigned(operation_type_table) then          begin            dispose(operation_type_table);            operation_type_table:=nil;          end;        if assigned(instabcache) then          begin            dispose(instabcache);            instabcache:=nil;          end;        if assigned(InsTabMemRefSizeInfoCache) then        begin          dispose(InsTabMemRefSizeInfoCache);          InsTabMemRefSizeInfoCache:=nil;        end;      end;begin  cai_align:=tai_align;  cai_cpu:=taicpu;end.
 |