| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762277227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382238323842385238623872388238923902391239223932394239523962397239823992400240124022403240424052406240724082409241024112412241324142415241624172418241924202421242224232424242524262427242824292430243124322433243424352436243724382439244024412442244324442445244624472448244924502451245224532454245524562457245824592460246124622463246424652466246724682469247024712472247324742475247624772478247924802481248224832484248524862487248824892490249124922493249424952496249724982499250025012502250325042505250625072508250925102511251225132514251525162517251825192520252125222523252425252526252725282529253025312532253325342535253625372538253925402541254225432544254525462547254825492550255125522553255425552556255725582559256025612562256325642565256625672568256925702571257225732574257525762577257825792580258125822583258425852586258725882589259025912592259325942595259625972598259926002601260226032604260526062607 | {    Copyright (c) 1998-2002 by Florian Klaempfl and Peter Vreman    Contains the abstract assembler implementation for the i386    * Portions of this code was inspired by the NASM sources      The Netwide Assembler is Copyright (c) 1996 Simon Tatham and      Julian Hall. All rights reserved.    This program is free software; you can redistribute it and/or modify    it under the terms of the GNU General Public License as published by    the Free Software Foundation; either version 2 of the License, or    (at your option) any later version.    This program is distributed in the hope that it will be useful,    but WITHOUT ANY WARRANTY; without even the implied warranty of    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the    GNU General Public License for more details.    You should have received a copy of the GNU General Public License    along with this program; if not, write to the Free Software    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. ****************************************************************************}unit aasmcpu;{$i fpcdefs.inc}interface    uses      globtype,verbose,      cpubase,      cgbase,cgutils,      symtype,      aasmbase,aasmtai,aasmdata,aasmsym,      ogbase;    const      { "mov reg,reg" source operand number }      O_MOV_SOURCE = 0;      { "mov reg,reg" destination operand number }      O_MOV_DEST = 1;    { Operand types }      OT_NONE      = $00000000;      { Bits 0..7: sizes }      OT_BITS8     = $00000001;      OT_BITS16    = $00000002;      OT_BITS32    = $00000004;      OT_BITS64    = $00000008;  { x86_64 and FPU }      OT_BITS80    = $00000010;  { FPU only  }      OT_FAR       = $00000020;  { this means 16:16 or 16:32, like in CALL/JMP }      OT_NEAR      = $00000040;      OT_SHORT     = $00000080;      { TODO: FAR/NEAR/SHORT are sizes too, they should be included into size mask,        but this requires adjusting the opcode table }      OT_SIZE_MASK = $0000001F;  { all the size attributes  }      OT_NON_SIZE  = longint(not OT_SIZE_MASK);      { Bits 8..11: modifiers }      OT_SIGNED    = $00000100;  { the operand need to be signed -128-127 }      OT_TO        = $00000200;  { reverse effect in FADD, FSUB &c  }      OT_COLON     = $00000400;  { operand is followed by a colon  }      OT_MODIFIER_MASK = $00000F00;      { Bits 12..15: type of operand }      OT_REGISTER  = $00001000;      OT_IMMEDIATE = $00002000;      OT_MEMORY    = $0000C000;  { always includes 'OT_REGMEM' bit as well }      OT_REGMEM    = $00008000;  { for r/m, ie EA, operands  }      OT_TYPE_MASK = OT_REGISTER or OT_IMMEDIATE or OT_MEMORY or OT_REGMEM;      OT_REGNORM   = OT_REGISTER or OT_REGMEM;  { 'normal' reg, qualifies as EA  }      { Bits 20..22, 24..26: register classes        otf_* consts are not used alone, only to build other constants. }      otf_reg_cdt  = $00100000;      otf_reg_gpr  = $00200000;      otf_reg_sreg = $00400000;      otf_reg_fpu  = $01000000;      otf_reg_mmx  = $02000000;      otf_reg_xmm  = $04000000;      { Bits 16..19: subclasses, meaning depends on classes field }      otf_sub0     = $00010000;      otf_sub1     = $00020000;      otf_sub2     = $00040000;      otf_sub3     = $00080000;      OT_REG_SMASK = otf_sub0 or otf_sub1 or otf_sub2 or otf_sub3;      { register class 0: CRx, DRx and TRx }      OT_REG_CDT   = OT_REGISTER or otf_reg_cdt or OT_BITS32;      OT_REG_CREG  = OT_REG_CDT or otf_sub0;  { CRn  }      OT_REG_DREG  = OT_REG_CDT or otf_sub1;  { DRn  }      OT_REG_TREG  = OT_REG_CDT or otf_sub2;  { TRn  }      OT_REG_CR4   = OT_REG_CDT or otf_sub3;  { CR4 (Pentium only)  }      { register class 1: general-purpose registers }      OT_REG_GPR   = OT_REGNORM or otf_reg_gpr;      OT_RM_GPR    = OT_REGMEM or otf_reg_gpr;      OT_REG8      = OT_REG_GPR or OT_BITS8;  { 8-bit GPR }      OT_REG16     = OT_REG_GPR or OT_BITS16;      OT_REG32     = OT_REG_GPR or OT_BITS32;      OT_REG64     = OT_REG_GPR or OT_BITS64;      { GPR subclass 0: accumulator: AL, AX, EAX or RAX }      OT_REG_ACCUM = OT_REG_GPR or otf_sub0;      OT_REG_AL    = OT_REG_ACCUM or OT_BITS8;      OT_REG_AX    = OT_REG_ACCUM or OT_BITS16;      OT_REG_EAX   = OT_REG_ACCUM or OT_BITS32;{$ifdef x86_64}      OT_REG_RAX   = OT_REG_ACCUM or OT_BITS64;{$endif x86_64}      { GPR subclass 1: counter: CL, CX, ECX or RCX }      OT_REG_COUNT = OT_REG_GPR or otf_sub1;      OT_REG_CL    = OT_REG_COUNT or OT_BITS8;      OT_REG_CX    = OT_REG_COUNT or OT_BITS16;      OT_REG_ECX   = OT_REG_COUNT or OT_BITS32;{$ifdef x86_64}      OT_REG_RCX   = OT_REG_COUNT or OT_BITS64;{$endif x86_64}      { GPR subclass 2: data register: DL, DX, EDX or RDX }      OT_REG_DX    = OT_REG_GPR or otf_sub2 or OT_BITS16;      OT_REG_EDX   = OT_REG_GPR or otf_sub2 or OT_BITS32;      { register class 2: Segment registers }      OT_REG_SREG  = OT_REGISTER or otf_reg_sreg or OT_BITS16;      OT_REG_CS    = OT_REG_SREG or otf_sub0;  { CS  }      OT_REG_DESS  = OT_REG_SREG or otf_sub1;  { DS, ES, SS (non-CS 86 registers)  }      OT_REG_FSGS  = OT_REG_SREG or otf_sub2;  { FS, GS (386 extended registers)  }      { register class 3: FPU registers }      OT_FPUREG    = OT_REGISTER or otf_reg_fpu;      OT_FPU0      = OT_FPUREG or otf_sub0;    { FPU stack register zero  }      { register class 4: MMX (both reg and r/m) }      OT_MMXREG    = OT_REGNORM or otf_reg_mmx;      OT_MMXRM     = OT_REGMEM or otf_reg_mmx;      { register class 5: XMM (both reg and r/m) }      OT_XMMREG    = OT_REGNORM or otf_reg_xmm;      OT_XMMRM     = OT_REGMEM or otf_reg_xmm;      { Memory operands }      OT_MEM8      = OT_MEMORY or OT_BITS8;      OT_MEM16     = OT_MEMORY or OT_BITS16;      OT_MEM32     = OT_MEMORY or OT_BITS32;      OT_MEM64     = OT_MEMORY or OT_BITS64;      OT_MEM80     = OT_MEMORY or OT_BITS80;      OT_MEM_OFFS  = OT_MEMORY or otf_sub0;  { special type of EA  }                                             { simple [address] offset  }      { Matches any type of r/m operand }      OT_MEMORY_ANY = OT_MEMORY or OT_RM_GPR or OT_XMMRM or OT_MMXRM;      { Immediate operands }      OT_IMM8      = OT_IMMEDIATE or OT_BITS8;      OT_IMM16     = OT_IMMEDIATE or OT_BITS16;      OT_IMM32     = OT_IMMEDIATE or OT_BITS32;      OT_IMM64     = OT_IMMEDIATE or OT_BITS64;      OT_ONENESS   = otf_sub0;  { special type of immediate operand  }      OT_UNITY     = OT_IMMEDIATE or OT_ONENESS;  { for shift/rotate instructions  }      { Size of the instruction table converted by nasmconv.pas }{$ifdef x86_64}      instabentries = {$i x8664nop.inc}{$else x86_64}      instabentries = {$i i386nop.inc}{$endif x86_64}      maxinfolen    = 8;      MaxInsChanges = 3; { Max things a instruction can change }    type      { What an instruction can change. Needed for optimizer and spilling code.        Note: The order of this enumeration is should not be changed! }      TInsChange = (Ch_None,        {Read from a register}        Ch_REAX, Ch_RECX, Ch_REDX, Ch_REBX, Ch_RESP, Ch_REBP, Ch_RESI, Ch_REDI,        {write from a register}        Ch_WEAX, Ch_WECX, Ch_WEDX, Ch_WEBX, Ch_WESP, Ch_WEBP, Ch_WESI, Ch_WEDI,        {read and write from/to a register}        Ch_RWEAX, Ch_RWECX, Ch_RWEDX, Ch_RWEBX, Ch_RWESP, Ch_RWEBP, Ch_RWESI, Ch_RWEDI,        {modify the contents of a register with the purpose of using         this changed content afterwards (add/sub/..., but e.g. not rep         or movsd)}        Ch_MEAX, Ch_MECX, Ch_MEDX, Ch_MEBX, Ch_MESP, Ch_MEBP, Ch_MESI, Ch_MEDI,        Ch_CDirFlag {clear direction flag}, Ch_SDirFlag {set dir flag},        Ch_RFlags, Ch_WFlags, Ch_RWFlags, Ch_FPU,        Ch_Rop1, Ch_Wop1, Ch_RWop1,Ch_Mop1,        Ch_Rop2, Ch_Wop2, Ch_RWop2,Ch_Mop2,        Ch_Rop3, Ch_WOp3, Ch_RWOp3,Ch_Mop3,        Ch_WMemEDI,        Ch_All,        { x86_64 registers }        Ch_RRAX, Ch_RRCX, Ch_RRDX, Ch_RRBX, Ch_RRSP, Ch_RRBP, Ch_RRSI, Ch_RRDI,        Ch_WRAX, Ch_WRCX, Ch_WRDX, Ch_WRBX, Ch_WRSP, Ch_WRBP, Ch_WRSI, Ch_WRDI,        Ch_RWRAX, Ch_RWRCX, Ch_RWRDX, Ch_RWRBX, Ch_RWRSP, Ch_RWRBP, Ch_RWRSI, Ch_RWRDI,        Ch_MRAX, Ch_MRCX, Ch_MRDX, Ch_MRBX, Ch_MRSP, Ch_MRBP, Ch_MRSI, Ch_MRDI      );      TInsProp = packed record        Ch : Array[1..MaxInsChanges] of TInsChange;      end;    const      InsProp : array[tasmop] of TInsProp ={$ifdef x86_64}        {$i x8664pro.inc}{$else x86_64}        {$i i386prop.inc}{$endif x86_64}    type      TOperandOrder = (op_intel,op_att);      tinsentry=packed record        opcode  : tasmop;        ops     : byte;        optypes : array[0..2] of longint;        code    : array[0..maxinfolen] of char;        flags   : cardinal;      end;      pinsentry=^tinsentry;      { alignment for operator }      tai_align = class(tai_align_abstract)         reg       : tregister;         constructor create(b:byte);override;         constructor create_op(b: byte; _op: byte);override;         function calculatefillbuf(var buf : tfillbuffer;executable : boolean):pchar;override;      end;      taicpu = class(tai_cpu_abstract_sym)         opsize    : topsize;         constructor op_none(op : tasmop);         constructor op_none(op : tasmop;_size : topsize);         constructor op_reg(op : tasmop;_size : topsize;_op1 : tregister);         constructor op_const(op : tasmop;_size : topsize;_op1 : aint);         constructor op_ref(op : tasmop;_size : topsize;const _op1 : treference);         constructor op_reg_reg(op : tasmop;_size : topsize;_op1,_op2 : tregister);         constructor op_reg_ref(op : tasmop;_size : topsize;_op1 : tregister;const _op2 : treference);         constructor op_reg_const(op:tasmop; _size: topsize; _op1: tregister; _op2: aint);         constructor op_const_reg(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister);         constructor op_const_const(op : tasmop;_size : topsize;_op1,_op2 : aint);         constructor op_const_ref(op : tasmop;_size : topsize;_op1 : aint;const _op2 : treference);         constructor op_ref_reg(op : tasmop;_size : topsize;const _op1 : treference;_op2 : tregister);         constructor op_reg_reg_reg(op : tasmop;_size : topsize;_op1,_op2,_op3 : tregister);         constructor op_const_reg_reg(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister;_op3 : tregister);         constructor op_const_ref_reg(op : tasmop;_size : topsize;_op1 : aint;const _op2 : treference;_op3 : tregister);         constructor op_reg_reg_ref(op : tasmop;_size : topsize;_op1,_op2 : tregister; const _op3 : treference);         constructor op_const_reg_ref(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister;const _op3 : treference);         { this is for Jmp instructions }         constructor op_cond_sym(op : tasmop;cond:TAsmCond;_size : topsize;_op1 : tasmsymbol);         constructor op_sym(op : tasmop;_size : topsize;_op1 : tasmsymbol);         constructor op_sym_ofs(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint);         constructor op_sym_ofs_reg(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint;_op2 : tregister);         constructor op_sym_ofs_ref(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint;const _op2 : treference);         procedure changeopsize(siz:topsize);         function  GetString:string;         procedure CheckNonCommutativeOpcodes;      private         FOperandOrder : TOperandOrder;         procedure init(_size : topsize); { this need to be called by all constructor }      public         { the next will reset all instructions that can change in pass 2 }         procedure ResetPass1;override;         procedure ResetPass2;override;         function  CheckIfValid:boolean;         function  Pass1(objdata:TObjData):longint;override;         procedure Pass2(objdata:TObjData);override;         procedure SetOperandOrder(order:TOperandOrder);         function is_same_reg_move(regtype: Tregistertype):boolean;override;         { register spilling code }         function spilling_get_operation_type(opnr: longint): topertype;override;      private         { next fields are filled in pass1, so pass2 is faster }         insentry  : PInsEntry;         insoffset : longint;         LastInsOffset : longint; { need to be public to be reset }         inssize   : shortint;{$ifdef x86_64}         rex       : byte;{$endif x86_64}         function  InsEnd:longint;         procedure create_ot(objdata:TObjData);         function  Matches(p:PInsEntry):boolean;         function  calcsize(p:PInsEntry):shortint;         procedure gencode(objdata:TObjData);         function  NeedAddrPrefix(opidx:byte):boolean;         procedure Swapoperands;         function  FindInsentry(objdata:TObjData):boolean;      end;    function spilling_create_load(const ref:treference;r:tregister):Taicpu;    function spilling_create_store(r:tregister; const ref:treference):Taicpu;    procedure InitAsm;    procedure DoneAsm;implementation     uses       cutils,       globals,       systems,       procinfo,       itcpugas,       symsym;{*****************************************************************************                              Instruction table*****************************************************************************}    const     {Instruction flags }       IF_NONE   = $00000000;       IF_SM     = $00000001;  { size match first two operands  }       IF_SM2    = $00000002;       IF_SB     = $00000004;  { unsized operands can't be non-byte  }       IF_SW     = $00000008;  { unsized operands can't be non-word  }       IF_SD     = $00000010;  { unsized operands can't be nondword  }       IF_SMASK  = $0000001f;       IF_AR0    = $00000020;  { SB, SW, SD applies to argument 0  }       IF_AR1    = $00000040;  { SB, SW, SD applies to argument 1  }       IF_AR2    = $00000060;  { SB, SW, SD applies to argument 2  }       IF_ARMASK = $00000060;  { mask for unsized argument spec  }       IF_ARSHIFT = 5;         { LSB of IF_ARMASK }       IF_PRIV   = $00000100;  { it's a privileged instruction  }       IF_SMM    = $00000200;  { it's only valid in SMM  }       IF_PROT   = $00000400;  { it's protected mode only  }       IF_NOX86_64 = $00000800;  { removed instruction in x86_64  }       IF_UNDOC  = $00001000;  { it's an undocumented instruction  }       IF_FPU    = $00002000;  { it's an FPU instruction  }       IF_MMX    = $00004000;  { it's an MMX instruction  }       { it's a 3DNow! instruction  }       IF_3DNOW  = $00008000;       { it's a SSE (KNI, MMX2) instruction  }       IF_SSE    = $00010000;       { SSE2 instructions  }       IF_SSE2   = $00020000;       { SSE3 instructions  }       IF_SSE3   = $00040000;       { SSE64 instructions  }       IF_SSE64  = $00080000;       { the mask for processor types  }       {IF_PMASK  = longint($FF000000);}       { the mask for disassembly "prefer"  }       {IF_PFMASK = longint($F001FF00);}       { SVM instructions  }       IF_SVM    = $00100000;       { SSE4 instructions  }       IF_SSE4   = $00200000;       { TODO: These flags were added to make x86ins.dat more readable.         Values must be reassigned to make any other use of them. }       IF_SSSE3  = $00200000;       IF_SSE41  = $00200000;       IF_SSE42  = $00200000;       IF_8086   = $00000000;  { 8086 instruction  }       IF_186    = $01000000;  { 186+ instruction  }       IF_286    = $02000000;  { 286+ instruction  }       IF_386    = $03000000;  { 386+ instruction  }       IF_486    = $04000000;  { 486+ instruction  }       IF_PENT   = $05000000;  { Pentium instruction  }       IF_P6     = $06000000;  { P6 instruction  }       IF_KATMAI = $07000000;  { Katmai instructions  }       { Willamette instructions }       IF_WILLAMETTE = $08000000;       { Prescott instructions }       IF_PRESCOTT = $09000000;       IF_X86_64 = $0a000000;       IF_CYRIX  = $0b000000;  { Cyrix-specific instruction  }       IF_AMD    = $0c000000;  { AMD-specific instruction  }       IF_CENTAUR = $0d000000;  { centaur-specific instruction  }       { added flags }       IF_PRE    = $40000000;  { it's a prefix instruction }       IF_PASS2  = $80000000;  { if the instruction can change in a second pass }     type       TInsTabCache=array[TasmOp] of longint;       PInsTabCache=^TInsTabCache;     const{$ifdef x86_64}       InsTab:array[0..instabentries-1] of TInsEntry={$i x8664tab.inc}{$else x86_64}       InsTab:array[0..instabentries-1] of TInsEntry={$i i386tab.inc}{$endif x86_64}     var       InsTabCache : PInsTabCache;     const{$ifdef x86_64}       { Intel style operands ! }       opsize_2_type:array[0..2,topsize] of longint=(         (OT_NONE,          OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS16,OT_BITS32,OT_BITS32,OT_BITS64,OT_BITS64,OT_BITS64,          OT_BITS16,OT_BITS32,OT_BITS64,          OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,          OT_BITS64,          OT_NEAR,OT_FAR,OT_SHORT,          OT_NONE,          OT_NONE         ),         (OT_NONE,          OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS8,OT_BITS8,OT_BITS16,OT_BITS8,OT_BITS16,OT_BITS32,          OT_BITS16,OT_BITS32,OT_BITS64,          OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,          OT_BITS64,          OT_NEAR,OT_FAR,OT_SHORT,          OT_NONE,          OT_NONE         ),         (OT_NONE,          OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_NONE,OT_NONE,OT_NONE,OT_NONE,OT_NONE,OT_NONE,          OT_BITS16,OT_BITS32,OT_BITS64,          OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,          OT_BITS64,          OT_NEAR,OT_FAR,OT_SHORT,          OT_NONE,          OT_NONE         )       );      reg_ot_table : array[tregisterindex] of longint = (        {$i r8664ot.inc}      );{$else x86_64}       { Intel style operands ! }       opsize_2_type:array[0..2,topsize] of longint=(         (OT_NONE,          OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS16,OT_BITS32,OT_BITS32,          OT_BITS16,OT_BITS32,OT_BITS64,          OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,          OT_BITS64,          OT_NEAR,OT_FAR,OT_SHORT,          OT_NONE,          OT_NONE         ),         (OT_NONE,          OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_BITS8,OT_BITS8,OT_BITS16,          OT_BITS16,OT_BITS32,OT_BITS64,          OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,          OT_BITS64,          OT_NEAR,OT_FAR,OT_SHORT,          OT_NONE,          OT_NONE         ),         (OT_NONE,          OT_BITS8,OT_BITS16,OT_BITS32,OT_BITS64,OT_NONE,OT_NONE,OT_NONE,          OT_BITS16,OT_BITS32,OT_BITS64,          OT_BITS32,OT_BITS64,OT_BITS80,OT_BITS64,OT_NONE,          OT_BITS64,          OT_NEAR,OT_FAR,OT_SHORT,          OT_NONE,          OT_NONE         )      );      reg_ot_table : array[tregisterindex] of longint = (        {$i r386ot.inc}      );{$endif x86_64}    { Operation type for spilling code }    type      toperation_type_table=array[tasmop,0..Max_Operands] of topertype;    var      operation_type_table : ^toperation_type_table;{****************************************************************************                              TAI_ALIGN ****************************************************************************}    constructor tai_align.create(b: byte);      begin        inherited create(b);        reg:=NR_ECX;      end;    constructor tai_align.create_op(b: byte; _op: byte);      begin        inherited create_op(b,_op);        reg:=NR_NO;      end;    function tai_align.calculatefillbuf(var buf : tfillbuffer;executable : boolean):pchar;      const{$ifdef x86_64}        alignarray:array[0..3] of string[4]=(          #$66#$66#$66#$90,          #$66#$66#$90,          #$66#$90,          #$90        );{$else x86_64}        alignarray:array[0..5] of string[8]=(          #$8D#$B4#$26#$00#$00#$00#$00,          #$8D#$B6#$00#$00#$00#$00,          #$8D#$74#$26#$00,          #$8D#$76#$00,          #$89#$F6,          #$90);{$endif x86_64}      var        bufptr : pchar;        j : longint;        localsize: byte;      begin        inherited calculatefillbuf(buf,executable);        if not(use_op) and executable then         begin           bufptr:=pchar(@buf);           { fillsize may still be used afterwards, so don't modify }           { e.g. writebytes(hp.calculatefillbuf(buf)^,hp.fillsize) }           localsize:=fillsize;           while (localsize>0) do            begin              for j:=low(alignarray) to high(alignarray) do               if (localsize>=length(alignarray[j])) then                break;              move(alignarray[j][1],bufptr^,length(alignarray[j]));              inc(bufptr,length(alignarray[j]));              dec(localsize,length(alignarray[j]));            end;         end;        calculatefillbuf:=pchar(@buf);      end;{*****************************************************************************                                 Taicpu Constructors*****************************************************************************}    procedure taicpu.changeopsize(siz:topsize);      begin        opsize:=siz;      end;    procedure taicpu.init(_size : topsize);      begin         { default order is att }         FOperandOrder:=op_att;         segprefix:=NR_NO;         opsize:=_size;         insentry:=nil;         LastInsOffset:=-1;         InsOffset:=0;         InsSize:=0;      end;    constructor taicpu.op_none(op : tasmop);      begin         inherited create(op);         init(S_NO);      end;    constructor taicpu.op_none(op : tasmop;_size : topsize);      begin         inherited create(op);         init(_size);      end;    constructor taicpu.op_reg(op : tasmop;_size : topsize;_op1 : tregister);      begin         inherited create(op);         init(_size);         ops:=1;         loadreg(0,_op1);      end;    constructor taicpu.op_const(op : tasmop;_size : topsize;_op1 : aint);      begin         inherited create(op);         init(_size);         ops:=1;         loadconst(0,_op1);      end;    constructor taicpu.op_ref(op : tasmop;_size : topsize;const _op1 : treference);      begin         inherited create(op);         init(_size);         ops:=1;         loadref(0,_op1);      end;    constructor taicpu.op_reg_reg(op : tasmop;_size : topsize;_op1,_op2 : tregister);      begin         inherited create(op);         init(_size);         ops:=2;         loadreg(0,_op1);         loadreg(1,_op2);      end;    constructor taicpu.op_reg_const(op:tasmop; _size: topsize; _op1: tregister; _op2: aint);      begin         inherited create(op);         init(_size);         ops:=2;         loadreg(0,_op1);         loadconst(1,_op2);      end;    constructor taicpu.op_reg_ref(op : tasmop;_size : topsize;_op1 : tregister;const _op2 : treference);      begin         inherited create(op);         init(_size);         ops:=2;         loadreg(0,_op1);         loadref(1,_op2);      end;    constructor taicpu.op_const_reg(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister);      begin         inherited create(op);         init(_size);         ops:=2;         loadconst(0,_op1);         loadreg(1,_op2);      end;    constructor taicpu.op_const_const(op : tasmop;_size : topsize;_op1,_op2 : aint);      begin         inherited create(op);         init(_size);         ops:=2;         loadconst(0,_op1);         loadconst(1,_op2);      end;    constructor taicpu.op_const_ref(op : tasmop;_size : topsize;_op1 : aint;const _op2 : treference);      begin         inherited create(op);         init(_size);         ops:=2;         loadconst(0,_op1);         loadref(1,_op2);      end;    constructor taicpu.op_ref_reg(op : tasmop;_size : topsize;const _op1 : treference;_op2 : tregister);      begin         inherited create(op);         init(_size);         ops:=2;         loadref(0,_op1);         loadreg(1,_op2);      end;    constructor taicpu.op_reg_reg_reg(op : tasmop;_size : topsize;_op1,_op2,_op3 : tregister);      begin         inherited create(op);         init(_size);         ops:=3;         loadreg(0,_op1);         loadreg(1,_op2);         loadreg(2,_op3);      end;    constructor taicpu.op_const_reg_reg(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister;_op3 : tregister);      begin         inherited create(op);         init(_size);         ops:=3;         loadconst(0,_op1);         loadreg(1,_op2);         loadreg(2,_op3);      end;    constructor taicpu.op_reg_reg_ref(op : tasmop;_size : topsize;_op1,_op2 : tregister;const _op3 : treference);      begin         inherited create(op);         init(_size);         ops:=3;         loadreg(0,_op1);         loadreg(1,_op2);         loadref(2,_op3);      end;    constructor taicpu.op_const_ref_reg(op : tasmop;_size : topsize;_op1 : aint;const _op2 : treference;_op3 : tregister);      begin         inherited create(op);         init(_size);         ops:=3;         loadconst(0,_op1);         loadref(1,_op2);         loadreg(2,_op3);      end;    constructor taicpu.op_const_reg_ref(op : tasmop;_size : topsize;_op1 : aint;_op2 : tregister;const _op3 : treference);      begin         inherited create(op);         init(_size);         ops:=3;         loadconst(0,_op1);         loadreg(1,_op2);         loadref(2,_op3);      end;    constructor taicpu.op_cond_sym(op : tasmop;cond:TAsmCond;_size : topsize;_op1 : tasmsymbol);      begin         inherited create(op);         init(_size);         condition:=cond;         ops:=1;         loadsymbol(0,_op1,0);      end;    constructor taicpu.op_sym(op : tasmop;_size : topsize;_op1 : tasmsymbol);      begin         inherited create(op);         init(_size);         ops:=1;         loadsymbol(0,_op1,0);      end;    constructor taicpu.op_sym_ofs(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint);      begin         inherited create(op);         init(_size);         ops:=1;         loadsymbol(0,_op1,_op1ofs);      end;    constructor taicpu.op_sym_ofs_reg(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint;_op2 : tregister);      begin         inherited create(op);         init(_size);         ops:=2;         loadsymbol(0,_op1,_op1ofs);         loadreg(1,_op2);      end;    constructor taicpu.op_sym_ofs_ref(op : tasmop;_size : topsize;_op1 : tasmsymbol;_op1ofs:longint;const _op2 : treference);      begin         inherited create(op);         init(_size);         ops:=2;         loadsymbol(0,_op1,_op1ofs);         loadref(1,_op2);      end;    function taicpu.GetString:string;      var        i : longint;        s : string;        addsize : boolean;      begin        s:='['+std_op2str[opcode];        for i:=0 to ops-1 do         begin           with oper[i]^ do             begin               if i=0 then                s:=s+' '               else                s:=s+',';               { type }               addsize:=false;               if (ot and OT_XMMREG)=OT_XMMREG then                s:=s+'xmmreg'               else                 if (ot and OT_MMXREG)=OT_MMXREG then                  s:=s+'mmxreg'               else                 if (ot and OT_FPUREG)=OT_FPUREG then                  s:=s+'fpureg'               else                if (ot and OT_REGISTER)=OT_REGISTER then                 begin                   s:=s+'reg';                   addsize:=true;                 end               else                if (ot and OT_IMMEDIATE)=OT_IMMEDIATE then                 begin                   s:=s+'imm';                   addsize:=true;                 end               else                if (ot and OT_MEMORY)=OT_MEMORY then                 begin                   s:=s+'mem';                   addsize:=true;                 end               else                 s:=s+'???';               { size }               if addsize then                begin                  if (ot and OT_BITS8)<>0 then                    s:=s+'8'                  else                   if (ot and OT_BITS16)<>0 then                    s:=s+'16'                  else                   if (ot and OT_BITS32)<>0 then                    s:=s+'32'                  else                   if (ot and OT_BITS64)<>0 then                    s:=s+'64'                  else                    s:=s+'??';                  { signed }                  if (ot and OT_SIGNED)<>0 then                   s:=s+'s';                end;             end;         end;        GetString:=s+']';      end;    procedure taicpu.Swapoperands;      var        p : POper;      begin        { Fix the operands which are in AT&T style and we need them in Intel style }        case ops of          2 : begin                { 0,1 -> 1,0 }                p:=oper[0];                oper[0]:=oper[1];                oper[1]:=p;              end;          3 : begin                { 0,1,2 -> 2,1,0 }                p:=oper[0];                oper[0]:=oper[2];                oper[2]:=p;              end;        end;      end;    procedure taicpu.SetOperandOrder(order:TOperandOrder);      begin        if FOperandOrder<>order then         begin           Swapoperands;           FOperandOrder:=order;         end;      end;    procedure taicpu.CheckNonCommutativeOpcodes;      begin        { we need ATT order }        SetOperandOrder(op_att);        if (            (ops=2) and            (oper[0]^.typ=top_reg) and            (oper[1]^.typ=top_reg) and           { if the first is ST and the second is also a register             it is necessarily ST1 .. ST7 }            ((oper[0]^.reg=NR_ST) or             (oper[0]^.reg=NR_ST0))           ) or           { ((ops=1) and            (oper[0]^.typ=top_reg) and            (oper[0]^.reg in [R_ST1..R_ST7]))  or}           (ops=0) then          begin            if opcode=A_FSUBR then              opcode:=A_FSUB            else if opcode=A_FSUB then              opcode:=A_FSUBR            else if opcode=A_FDIVR then              opcode:=A_FDIV            else if opcode=A_FDIV then              opcode:=A_FDIVR            else if opcode=A_FSUBRP then              opcode:=A_FSUBP            else if opcode=A_FSUBP then              opcode:=A_FSUBRP            else if opcode=A_FDIVRP then              opcode:=A_FDIVP            else if opcode=A_FDIVP then              opcode:=A_FDIVRP;          end;        if (            (ops=1) and            (oper[0]^.typ=top_reg) and            (getregtype(oper[0]^.reg)=R_FPUREGISTER) and            (oper[0]^.reg<>NR_ST)           ) then         begin           if opcode=A_FSUBRP then             opcode:=A_FSUBP           else if opcode=A_FSUBP then             opcode:=A_FSUBRP           else if opcode=A_FDIVRP then             opcode:=A_FDIVP           else if opcode=A_FDIVP then             opcode:=A_FDIVRP;         end;      end;{*****************************************************************************                                Assembler*****************************************************************************}    type      ea = packed record        sib_present : boolean;        bytes : byte;        size  : byte;        modrm : byte;        sib   : byte;{$ifdef x86_64}        rex   : byte;{$endif x86_64}      end;    procedure taicpu.create_ot(objdata:TObjData);      {        this function will also fix some other fields which only needs to be once      }      var        i,l,relsize : longint;        currsym : TObjSymbol;      begin        if ops=0 then         exit;        { update oper[].ot field }        for i:=0 to ops-1 do         with oper[i]^ do          begin            case typ of              top_reg :                begin                  ot:=reg_ot_table[findreg_by_number(reg)];                end;              top_ref :                begin                  if (ref^.refaddr=addr_no){$ifdef i386}                     or (                         (ref^.refaddr in [addr_pic]) and                         { allow any base for assembler blocks }                        ((assigned(current_procinfo) and                         (pi_has_assembler_block in current_procinfo.flags) and                         (ref^.base<>NR_NO)) or (ref^.base=NR_EBX))                        ){$endif i386}{$ifdef x86_64}                     or (                         (ref^.refaddr in [addr_pic,addr_pic_no_got]) and                         (ref^.base<>NR_NO)                        ){$endif x86_64}                     then                    begin                      { create ot field }                      if (ot and OT_SIZE_MASK)=0 then                        ot:=OT_MEMORY_ANY or opsize_2_type[i,opsize]                      else                        ot:=OT_MEMORY_ANY or (ot and OT_SIZE_MASK);                      if (ref^.base=NR_NO) and (ref^.index=NR_NO) then                        ot:=ot or OT_MEM_OFFS;                      { fix scalefactor }                      if (ref^.index=NR_NO) then                       ref^.scalefactor:=0                      else                       if (ref^.scalefactor=0) then                        ref^.scalefactor:=1;                    end                  else                    begin                      { Jumps use a relative offset which can be 8bit,                        for other opcodes we always need to generate the full                        32bit address }                      if assigned(objdata) and                         is_jmp then                        begin                          currsym:=objdata.symbolref(ref^.symbol);                          l:=ref^.offset;                          if assigned(currsym) then                            inc(l,currsym.address);                          { when it is a forward jump we need to compensate the                            offset of the instruction since the previous time,                            because the symbol address is then still using the                            'old-style' addressing.                            For backwards jumps this is not required because the                            address of the symbol is already adjusted to the                            new offset }                          if (l>InsOffset) and (LastInsOffset<>-1) then                            inc(l,InsOffset-LastInsOffset);                          { instruction size will then always become 2 (PFV) }                          relsize:=(InsOffset+2)-l;                          if (relsize>=-128) and (relsize<=127) and                             (                              not assigned(currsym) or                              (currsym.objsection=objdata.currobjsec)                             ) then                            ot:=OT_IMM8 or OT_SHORT                          else                            ot:=OT_IMM32 or OT_NEAR;                        end                      else                        ot:=OT_IMM32 or OT_NEAR;                    end;                end;              top_local :                begin                  if (ot and OT_SIZE_MASK)=0 then                    ot:=OT_MEMORY or opsize_2_type[i,opsize]                  else                    ot:=OT_MEMORY or (ot and OT_SIZE_MASK);                end;              top_const :                begin                  { allow 2nd or 3rd operand being a constant and expect no size for shuf* etc. }                  { further, allow AAD and AAM with imm. operand }                  if (opsize=S_NO) and not((i in [1,2]) or ((i=0) and (opcode in [A_AAD,A_AAM]))) then                    message(asmr_e_invalid_opcode_and_operand);                  if (opsize<>S_W) and (aint(val)>=-128) and (val<=127) then                    ot:=OT_IMM8 or OT_SIGNED                  else                    ot:=OT_IMMEDIATE or opsize_2_type[i,opsize];                  if (val=1) and (i=1) then                    ot := ot or OT_ONENESS;                end;              top_none :                begin                  { generated when there was an error in the                    assembler reader. It never happends when generating                    assembler }                end;              else                internalerror(200402261);            end;          end;      end;    function taicpu.InsEnd:longint;      begin        InsEnd:=InsOffset+InsSize;      end;      function taicpu.Matches(p:PInsEntry):boolean;      { * IF_SM stands for Size Match: any operand whose size is not       * explicitly specified by the template is `really' intended to be       * the same size as the first size-specified operand.       * Non-specification is tolerated in the input instruction, but       * _wrong_ specification is not.       *       * IF_SM2 invokes Size Match on only the first _two_ operands, for       * three-operand instructions such as SHLD: it implies that the       * first two operands must match in size, but that the third is       * required to be _unspecified_.       *       * IF_SB invokes Size Byte: operands with unspecified size in the       * template are really bytes, and so no non-byte specification in       * the input instruction will be tolerated. IF_SW similarly invokes       * Size Word, and IF_SD invokes Size Doubleword.       *       * (The default state if neither IF_SM nor IF_SM2 is specified is       * that any operand with unspecified size in the template is       * required to have unspecified size in the instruction too...)      }      var        insot,        currot,        i,j,asize,oprs : longint;        insflags:cardinal;        siz : array[0..2] of longint;      begin        result:=false;        { Check the opcode and operands }        if (p^.opcode<>opcode) or (p^.ops<>ops) then          exit;        for i:=0 to p^.ops-1 do         begin           insot:=p^.optypes[i];           currot:=oper[i]^.ot;           { Check the operand flags }           if (insot and (not currot) and OT_NON_SIZE)<>0 then             exit;           { Check if the passed operand size matches with one of             the supported operand sizes }           if ((insot and OT_SIZE_MASK)<>0) and              ((insot and currot and OT_SIZE_MASK)<>(currot and OT_SIZE_MASK)) then             exit;         end;        { Check operand sizes }        insflags:=p^.flags;        if insflags and IF_SMASK<>0 then          begin            { as default an untyped size can get all the sizes, this is different              from nasm, but else we need to do a lot checking which opcodes want              size or not with the automatic size generation }            asize:=-1;            if (insflags and IF_SB)<>0 then              asize:=OT_BITS8            else if (insflags and IF_SW)<>0 then              asize:=OT_BITS16            else if (insflags and IF_SD)<>0 then              asize:=OT_BITS32;            if (insflags and IF_ARMASK)<>0 then             begin               siz[0]:=-1;               siz[1]:=-1;               siz[2]:=-1;               siz[((insflags and IF_ARMASK) shr IF_ARSHIFT)-1]:=asize;             end            else             begin               siz[0]:=asize;               siz[1]:=asize;               siz[2]:=asize;             end;            if (insflags and (IF_SM or IF_SM2))<>0 then             begin               if (insflags and IF_SM2)<>0 then                oprs:=2               else                oprs:=p^.ops;               for i:=0 to oprs-1 do                if ((p^.optypes[i] and OT_SIZE_MASK) <> 0) then                 begin                   for j:=0 to oprs-1 do                    siz[j]:=p^.optypes[i] and OT_SIZE_MASK;                   break;                 end;              end             else              oprs:=2;            { Check operand sizes }            for i:=0 to p^.ops-1 do              begin                insot:=p^.optypes[i];                currot:=oper[i]^.ot;                if ((insot and OT_SIZE_MASK)=0) and                   ((currot and OT_SIZE_MASK and (not siz[i]))<>0) and                   { Immediates can always include smaller size }                   ((currot and OT_IMMEDIATE)=0) and                    (((insot and OT_SIZE_MASK) or siz[i])<(currot and OT_SIZE_MASK)) then                  exit;              end;          end;        result:=true;      end;    procedure taicpu.ResetPass1;      begin        { we need to reset everything here, because the choosen insentry          can be invalid for a new situation where the previously optimized          insentry is not correct }        InsEntry:=nil;        InsSize:=0;        LastInsOffset:=-1;      end;    procedure taicpu.ResetPass2;      begin        { we are here in a second pass, check if the instruction can be optimized }        if assigned(InsEntry) and           ((InsEntry^.flags and IF_PASS2)<>0) then         begin           InsEntry:=nil;           InsSize:=0;         end;        LastInsOffset:=-1;      end;    function taicpu.CheckIfValid:boolean;      begin        result:=FindInsEntry(nil);      end;    function taicpu.FindInsentry(objdata:TObjData):boolean;      var        i : longint;      begin        result:=false;      { Things which may only be done once, not when a second pass is done to        optimize }        if (Insentry=nil) or ((InsEntry^.flags and IF_PASS2)<>0) then         begin           current_filepos:=fileinfo;           { We need intel style operands }           SetOperandOrder(op_intel);           { create the .ot fields }           create_ot(objdata);           { set the file postion }         end        else         begin           { we've already an insentry so it's valid }           result:=true;           exit;         end;        { Lookup opcode in the table }        InsSize:=-1;        i:=instabcache^[opcode];        if i=-1 then         begin           Message1(asmw_e_opcode_not_in_table,gas_op2str[opcode]);           exit;         end;        insentry:=@instab[i];        while (insentry^.opcode=opcode) do         begin           if matches(insentry) then             begin               result:=true;               exit;             end;           inc(insentry);         end;        Message1(asmw_e_invalid_opcode_and_operands,GetString);        { No instruction found, set insentry to nil and inssize to -1 }        insentry:=nil;        inssize:=-1;      end;    function taicpu.Pass1(objdata:TObjData):longint;      begin        Pass1:=0;        { Save the old offset and set the new offset }        InsOffset:=ObjData.CurrObjSec.Size;        { Error? }        if (Insentry=nil) and (InsSize=-1) then          exit;        { set the file postion }        current_filepos:=fileinfo;        { Get InsEntry }        if FindInsEntry(ObjData) then         begin           { Calculate instruction size }           InsSize:=calcsize(insentry);           if segprefix<>NR_NO then            inc(InsSize);           { Fix opsize if size if forced }           if (insentry^.flags and (IF_SB or IF_SW or IF_SD))<>0 then             begin               if (insentry^.flags and IF_ARMASK)=0 then                 begin                   if (insentry^.flags and IF_SB)<>0 then                     begin                       if opsize=S_NO then                         opsize:=S_B;                     end                   else if (insentry^.flags and IF_SW)<>0 then                     begin                       if opsize=S_NO then                         opsize:=S_W;                     end                   else if (insentry^.flags and IF_SD)<>0 then                     begin                       if opsize=S_NO then                         opsize:=S_L;                     end;                 end;             end;           LastInsOffset:=InsOffset;           Pass1:=InsSize;           exit;         end;        LastInsOffset:=-1;      end;    const      segprefixes: array[NR_CS..NR_GS] of Byte=(      //cs   ds   es   ss   fs   gs        $2E, $3E, $26, $36, $64, $65      );    procedure taicpu.Pass2(objdata:TObjData);      begin        { error in pass1 ? }        if insentry=nil then         exit;        current_filepos:=fileinfo;        { Segment override }        if (segprefix>=NR_CS) and (segprefix<=NR_GS) then         begin           objdata.writebytes(segprefixes[segprefix],1);           { fix the offset for GenNode }           inc(InsOffset);         end        else if segprefix<>NR_NO then          InternalError(201001071);        { Generate the instruction }        GenCode(objdata);      end;    function taicpu.needaddrprefix(opidx:byte):boolean;      begin        result:=(oper[opidx]^.typ=top_ref) and                (oper[opidx]^.ref^.refaddr=addr_no) and    {$ifdef x86_64}                (oper[opidx]^.ref^.base<>NR_RIP) and    {$endif x86_64}                (                 (                  (oper[opidx]^.ref^.index<>NR_NO) and                  (getsubreg(oper[opidx]^.ref^.index)<>R_SUBADDR)                 ) or                 (                  (oper[opidx]^.ref^.base<>NR_NO) and                  (getsubreg(oper[opidx]^.ref^.base)<>R_SUBADDR)                 )                );      end;    function regval(r:Tregister):byte;      const    {$ifdef x86_64}        opcode_table:array[tregisterindex] of tregisterindex = (          {$i r8664op.inc}        );    {$else x86_64}        opcode_table:array[tregisterindex] of tregisterindex = (          {$i r386op.inc}        );    {$endif x86_64}      var        regidx : tregisterindex;      begin        regidx:=findreg_by_number(r);        if regidx<>0 then          result:=opcode_table[regidx]        else          begin            Message1(asmw_e_invalid_register,generic_regname(r));            result:=0;          end;      end;{$ifdef x86_64}    function rexbits(r: tregister): byte;      begin        result:=0;        case getregtype(r) of          R_INTREGISTER:            if (getsupreg(r)>=RS_R8) then          { Either B,X or R bits can be set, depending on register role in instruction.            Set all three bits here, caller will discard unnecessary ones. }              result:=result or $47            else if (getsubreg(r)=R_SUBL) and              (getsupreg(r) in [RS_RDI,RS_RSI,RS_RBP,RS_RSP]) then              result:=result or $40            else if (getsubreg(r)=R_SUBH) then          { Not an actual REX bit, used to detect incompatible usage of            AH/BH/CH/DH }              result:=result or $80;          R_MMREGISTER:            if getsupreg(r)>=RS_XMM8 then              result:=result or $47;        end;      end;    function process_ea(const input:toper;out output:ea;rfield:longint):boolean;      var        sym   : tasmsymbol;        md,s,rv  : byte;        base,index,scalefactor,        o     : longint;        ir,br : Tregister;        isub,bsub : tsubregister;      begin        process_ea:=false;        fillchar(output,sizeof(output),0);        {Register ?}        if (input.typ=top_reg) then          begin            rv:=regval(input.reg);            output.modrm:=$c0 or (rfield shl 3) or rv;            output.size:=1;            output.rex:=output.rex or (rexbits(input.reg) and $F1);            process_ea:=true;            exit;         end;        {No register, so memory reference.}        if input.typ<>top_ref then          internalerror(200409263);        ir:=input.ref^.index;        br:=input.ref^.base;        isub:=getsubreg(ir);        bsub:=getsubreg(br);        s:=input.ref^.scalefactor;        o:=input.ref^.offset;        sym:=input.ref^.symbol;        if ((ir<>NR_NO) and (getregtype(ir)<>R_INTREGISTER)) or           ((br<>NR_NO) and (br<>NR_RIP) and (getregtype(br)<>R_INTREGISTER)) then          internalerror(200301081);        { it's direct address }        if (br=NR_NO) and (ir=NR_NO) then         begin           output.sib_present:=true;           output.bytes:=4;           output.modrm:=4 or (rfield shl 3);           output.sib:=$25;         end        else if (br=NR_RIP) and (ir=NR_NO) then          begin            { rip based }            output.sib_present:=false;            output.bytes:=4;            output.modrm:=5 or (rfield shl 3);          end        else        { it's an indirection }         begin           { 16 bit or 32 bit address? }           if ((ir<>NR_NO) and (isub<>R_SUBADDR)) or              ((br<>NR_NO) and (bsub<>R_SUBADDR)) then             message(asmw_e_16bit_32bit_not_supported);           { wrong, for various reasons }           if (ir=NR_ESP) or ((s<>1) and (s<>2) and (s<>4) and (s<>8) and (ir<>NR_NO)) then            exit;           output.rex:=output.rex or (rexbits(br) and $F1) or (rexbits(ir) and $F2);           process_ea:=true;           { base }           case br of             NR_R8,             NR_RAX : base:=0;             NR_R9,             NR_RCX : base:=1;             NR_R10,             NR_RDX : base:=2;             NR_R11,             NR_RBX : base:=3;             NR_R12,             NR_RSP : base:=4;             NR_R13,             NR_NO,             NR_RBP : base:=5;             NR_R14,             NR_RSI : base:=6;             NR_R15,             NR_RDI : base:=7;           else             exit;           end;           { index }           case ir of             NR_R8,             NR_RAX : index:=0;             NR_R9,             NR_RCX : index:=1;             NR_R10,             NR_RDX : index:=2;             NR_R11,             NR_RBX : index:=3;             NR_R12,             NR_NO  : index:=4;             NR_R13,             NR_RBP : index:=5;             NR_R14,             NR_RSI : index:=6;             NR_R15,             NR_RDI : index:=7;           else             exit;           end;           case s of            0,            1 : scalefactor:=0;            2 : scalefactor:=1;            4 : scalefactor:=2;            8 : scalefactor:=3;           else            exit;           end;           { If rbp or r13 is used we must always include an offset }           if (br=NR_NO) or              ((br<>NR_RBP) and (br<>NR_R13) and (o=0) and (sym=nil)) then            md:=0           else            if ((o>=-128) and (o<=127) and (sym=nil)) then             md:=1            else             md:=2;           if (br=NR_NO) or (md=2) then            output.bytes:=4           else            output.bytes:=md;           { SIB needed ? }           if (ir=NR_NO) and (br<>NR_RSP) and (br<>NR_R12) then            begin              output.sib_present:=false;              output.modrm:=(md shl 6) or (rfield shl 3) or base;            end           else            begin              output.sib_present:=true;              output.modrm:=(md shl 6) or (rfield shl 3) or 4;              output.sib:=(scalefactor shl 6) or (index shl 3) or base;            end;         end;        output.size:=1+ord(output.sib_present)+output.bytes;        process_ea:=true;      end;{$else x86_64}    function process_ea(const input:toper;out output:ea;rfield:longint):boolean;      var        sym   : tasmsymbol;        md,s,rv  : byte;        base,index,scalefactor,        o     : longint;        ir,br : Tregister;        isub,bsub : tsubregister;      begin        process_ea:=false;        fillchar(output,sizeof(output),0);        {Register ?}        if (input.typ=top_reg) then          begin            rv:=regval(input.reg);            output.modrm:=$c0 or (rfield shl 3) or rv;            output.size:=1;            process_ea:=true;            exit;         end;        {No register, so memory reference.}        if (input.typ<>top_ref) then          internalerror(200409262);        if ((input.ref^.index<>NR_NO) and (getregtype(input.ref^.index)<>R_INTREGISTER)) or           ((input.ref^.base<>NR_NO) and (getregtype(input.ref^.base)<>R_INTREGISTER)) then          internalerror(200301081);        ir:=input.ref^.index;        br:=input.ref^.base;        isub:=getsubreg(ir);        bsub:=getsubreg(br);        s:=input.ref^.scalefactor;        o:=input.ref^.offset;        sym:=input.ref^.symbol;      { it's direct address }        if (br=NR_NO) and (ir=NR_NO) then         begin           { it's a pure offset }           output.sib_present:=false;           output.bytes:=4;           output.modrm:=5 or (rfield shl 3);         end        else        { it's an indirection }         begin           { 16 bit address? }           if ((ir<>NR_NO) and (isub<>R_SUBADDR)) or              ((br<>NR_NO) and (bsub<>R_SUBADDR)) then             message(asmw_e_16bit_not_supported);{$ifdef OPTEA}           { make single reg base }           if (br=NR_NO) and (s=1) then            begin              br:=ir;              ir:=NR_NO;            end;           { convert [3,5,9]*EAX to EAX+[2,4,8]*EAX }           if (br=NR_NO) and              (((s=2) and (ir<>NR_ESP)) or                (s=3) or (s=5) or (s=9)) then            begin              br:=ir;              dec(s);            end;           { swap ESP into base if scalefactor is 1 }           if (s=1) and (ir=NR_ESP) then            begin              ir:=br;              br:=NR_ESP;            end;{$endif OPTEA}           { wrong, for various reasons }           if (ir=NR_ESP) or ((s<>1) and (s<>2) and (s<>4) and (s<>8) and (ir<>NR_NO)) then            exit;           { base }           case br of             NR_EAX : base:=0;             NR_ECX : base:=1;             NR_EDX : base:=2;             NR_EBX : base:=3;             NR_ESP : base:=4;             NR_NO,             NR_EBP : base:=5;             NR_ESI : base:=6;             NR_EDI : base:=7;           else             exit;           end;           { index }           case ir of             NR_EAX : index:=0;             NR_ECX : index:=1;             NR_EDX : index:=2;             NR_EBX : index:=3;             NR_NO  : index:=4;             NR_EBP : index:=5;             NR_ESI : index:=6;             NR_EDI : index:=7;           else             exit;           end;           case s of            0,            1 : scalefactor:=0;            2 : scalefactor:=1;            4 : scalefactor:=2;            8 : scalefactor:=3;           else            exit;           end;           if (br=NR_NO) or              ((br<>NR_EBP) and (o=0) and (sym=nil)) then            md:=0           else            if ((o>=-128) and (o<=127) and (sym=nil)) then             md:=1            else             md:=2;           if (br=NR_NO) or (md=2) then            output.bytes:=4           else            output.bytes:=md;           { SIB needed ? }           if (ir=NR_NO) and (br<>NR_ESP) then            begin              output.sib_present:=false;              output.modrm:=(longint(md) shl 6) or (rfield shl 3) or base;            end           else            begin              output.sib_present:=true;              output.modrm:=(longint(md) shl 6) or (rfield shl 3) or 4;              output.sib:=(scalefactor shl 6) or (index shl 3) or base;            end;         end;        if output.sib_present then         output.size:=2+output.bytes        else         output.size:=1+output.bytes;        process_ea:=true;      end;{$endif x86_64}    function taicpu.calcsize(p:PInsEntry):shortint;      var        codes : pchar;        c     : byte;        len     : shortint;        ea_data : ea;        omit_rexw : boolean;      begin        len:=0;        codes:=@p^.code[0];{$ifdef x86_64}        rex:=0;        omit_rexw:=false;{$endif x86_64}        repeat          c:=ord(codes^);          inc(codes);          case c of            0 :              break;            1,2,3 :              begin                inc(codes,c);                inc(len,c);              end;            8,9,10 :              begin{$ifdef x86_64}                rex:=rex or (rexbits(oper[c-8]^.reg) and $F1);{$endif x86_64}                inc(codes);                inc(len);              end;            11 :              begin                inc(codes);                inc(len);              end;            4,5,6,7 :              begin                if opsize=S_W then                  inc(len,2)                else                  inc(len);              end;            12,13,14,            16,17,18,            20,21,22,            40,41,42 :              inc(len);            24,25,26,            31,            48,49,50 :              inc(len,2);            28,29,30:              begin                if opsize=S_Q then                  inc(len,8)                else                  inc(len,4);              end;            36,37,38:              inc(len,sizeof(pint));            44,45,46:              inc(len,8);            32,33,34,            52,53,54,            56,57,58,            172,173,174 :              inc(len,4);            208,209,210 :              begin                case (oper[c-208]^.ot and OT_SIZE_MASK) of                  OT_BITS16:                    inc(len);{$ifdef x86_64}                  OT_BITS64:                    begin                      rex:=rex or $48;                    end;{$endif x86_64}                end;              end;            200 :{$ifndef x86_64}              inc(len);{$else x86_64}              { every insentry with code 0310 must be marked with NOX86_64 }              InternalError(2011051301);{$endif x86_64}            201 :{$ifdef x86_64}              inc(len){$endif x86_64}              ;            212 :              inc(len);            214 :              begin{$ifdef x86_64}                rex:=rex or $48;{$endif x86_64}              end;            202,            211,            213,            215,            217,218: ;            219,220,241 :              inc(len);            221:{$ifdef x86_64}              omit_rexw:=true{$endif x86_64}              ;            64..151 :              begin{$ifdef x86_64}                 if (c<127) then                  begin                    if (oper[c and 7]^.typ=top_reg) then                      begin                        rex:=rex or (rexbits(oper[c and 7]^.reg) and $F4);                      end;                  end;{$endif x86_64}                if not process_ea(oper[(c shr 3) and 7]^, ea_data, 0) then                  Message(asmw_e_invalid_effective_address)                else                  inc(len,ea_data.size);{$ifdef x86_64}                rex:=rex or ea_data.rex;{$endif x86_64}              end;            else             InternalError(200603141);          end;        until false;{$ifdef x86_64}        if ((rex and $80)<>0) and ((rex and $4F)<>0) then          Message(asmw_e_bad_reg_with_rex);        rex:=rex and $4F;      { reset extra bits in upper nibble }        if omit_rexw then          begin            if rex=$48 then    { remove rex entirely? }              rex:=0            else              rex:=rex and $F7;          end;        if rex<>0 then          Inc(len);{$endif}        calcsize:=len;      end;    procedure taicpu.GenCode(objdata:TObjData);      {       * the actual codes (C syntax, i.e. octal):       * \0            - terminates the code. (Unless it's a literal of course.)       * \1, \2, \3    - that many literal bytes follow in the code stream       * \4, \6        - the POP/PUSH (respectively) codes for CS, DS, ES, SS       *                 (POP is never used for CS) depending on operand 0       * \5, \7        - the second byte of POP/PUSH codes for FS, GS, depending       *                 on operand 0       * \10, \11, \12 - a literal byte follows in the code stream, to be added       *                 to the register value of operand 0, 1 or 2       * \13           - a literal byte follows in the code stream, to be added       *                 to the condition code value of the instruction.       * \14, \15, \16 - a signed byte immediate operand, from operand 0, 1 or 2       * \20, \21, \22 - a byte immediate operand, from operand 0, 1 or 2       * \24, \25, \26 - an unsigned byte immediate operand, from operand 0, 1 or 2       * \30, \31, \32 - a word immediate operand, from operand 0, 1 or 2       * \34, \35, \36 - select between \3[012] and \4[012] depending on 16/32 bit       *                 assembly mode or the address-size override on the operand       * \37           - a word constant, from the _segment_ part of operand 0       * \40, \41, \42 - a long immediate operand, from operand 0, 1 or 2       * \44, \45, \46 - select between \3[012], \4[012] or \5[456] depending                         on the address size of instruction       * \50, \51, \52 - a byte relative operand, from operand 0, 1 or 2       * \54, \55, \56 - a qword immediate, from operand 0, 1 or 2       * \60, \61, \62 - a word relative operand, from operand 0, 1 or 2       * \64, \65, \66 - select between \6[012] and \7[012] depending on 16/32 bit       *                 assembly mode or the address-size override on the operand       * \70, \71, \72 - a long relative operand, from operand 0, 1 or 2       * \1ab          - a ModRM, calculated on EA in operand a, with the spare       *                 field the register value of operand b.       * \2ab          - a ModRM, calculated on EA in operand a, with the spare       *                 field equal to digit b.       * \254,\255,\256 - a signed 32-bit immediate to be extended to 64 bits       * \300,\301,\302 - might be an 0x67, depending on the address size of       *                 the memory reference in operand x.       * \310          - indicates fixed 16-bit address size, i.e. optional 0x67.       * \311          - indicates fixed 32-bit address size, i.e. optional 0x67.       * \312          - (disassembler only) invalid with non-default address size.       * \320,\321,\322 - might be an 0x66 or 0x48 byte, depending on the operand       *                 size of operand x.       * \324          - indicates fixed 16-bit operand size, i.e. optional 0x66.       * \325          - indicates fixed 32-bit operand size, i.e. optional 0x66.       * \326          - indicates fixed 64-bit operand size, i.e. optional 0x48.       * \327          - indicates that this instruction is only valid when the       *                 operand size is the default (instruction to disassembler,       *                 generates no code in the assembler)       * \331          - instruction not valid with REP prefix.  Hint for       *                 disassembler only; for SSE instructions.       * \332	       - disassemble a rep (0xF3 byte) prefix as repe not rep.       * \333          - 0xF3 prefix for SSE instructions       * \334          - 0xF2 prefix for SSE instructions       * \335          - Indicates 64-bit operand size with REX.W not necessary       * \361          - 0x66 prefix for SSE instructions      }      var        currval : aint;        currsym : tobjsymbol;        currrelreloc,        currabsreloc,        currabsreloc32 : TObjRelocationType;{$ifdef x86_64}        rexwritten : boolean;{$endif x86_64}        procedure getvalsym(opidx:longint);          begin            case oper[opidx]^.typ of              top_ref :                begin                  currval:=oper[opidx]^.ref^.offset;                  currsym:=ObjData.symbolref(oper[opidx]^.ref^.symbol);{$ifdef i386}                  if (oper[opidx]^.ref^.refaddr=addr_pic) and                     (tf_pic_uses_got in target_info.flags) then                    begin                      currrelreloc:=RELOC_PLT32;                      currabsreloc:=RELOC_GOT32;                      currabsreloc32:=RELOC_GOT32;                    end                  else{$endif i386}{$ifdef x86_64}                  if oper[opidx]^.ref^.refaddr=addr_pic then                    begin                      currrelreloc:=RELOC_PLT32;                      currabsreloc:=RELOC_GOTPCREL;                      currabsreloc32:=RELOC_GOTPCREL;                    end                  else if oper[opidx]^.ref^.refaddr=addr_pic_no_got then                    begin                      currrelreloc:=RELOC_RELATIVE;                      currabsreloc:=RELOC_RELATIVE;                      currabsreloc32:=RELOC_RELATIVE;                    end                  else{$endif x86_64}                    begin                      currrelreloc:=RELOC_RELATIVE;                      currabsreloc:=RELOC_ABSOLUTE;                      currabsreloc32:=RELOC_ABSOLUTE32;                    end;                end;              top_const :                begin                  currval:=aint(oper[opidx]^.val);                  currsym:=nil;                  currabsreloc:=RELOC_ABSOLUTE;                  currabsreloc32:=RELOC_ABSOLUTE32;                end;              else                Message(asmw_e_immediate_or_reference_expected);            end;          end;{$ifdef x86_64}       procedure maybewriterex;       begin          if (rex<>0) and not(rexwritten) then            begin              rexwritten:=true;              objdata.writebytes(rex,1);            end;        end;{$endif x86_64}       procedure objdata_writereloc(Data:aint;len:aword;p:TObjSymbol;Reloctype:TObjRelocationType);         begin{$ifdef i386}               { Special case of '_GLOBAL_OFFSET_TABLE_'                 which needs a special relocation type R_386_GOTPC }               if assigned (p) and                  (p.name='_GLOBAL_OFFSET_TABLE_') and                  (tf_pic_uses_got in target_info.flags) then                 begin                   { nothing else than a 4 byte relocation should occur                     for GOT }                   if len<>4 then                     Message1(asmw_e_invalid_opcode_and_operands,GetString);                   Reloctype:=RELOC_GOTPC;                   { We need to add the offset of the relocation                     of _GLOBAL_OFFSET_TABLE symbol within                     the current instruction }                   inc(data,objdata.currobjsec.size-insoffset);                 end;{$endif i386}           objdata.writereloc(data,len,p,Reloctype);         end;      const        CondVal:array[TAsmCond] of byte=($0,         $7, $3, $2, $6, $2, $4, $F, $D, $C, $E, $6, $2,         $3, $7, $3, $5, $E, $C, $D, $F, $1, $B, $9, $5,         $0, $A, $A, $B, $8, $4);      var        c : byte;        pb : pbyte;        codes : pchar;        bytes : array[0..3] of byte;        rfield,        data,s,opidx : longint;        ea_data : ea;        relsym : TObjSymbol;      begin        { safety check }        if objdata.currobjsec.size<>longword(insoffset) then           internalerror(200130121);        { load data to write }        codes:=insentry^.code;{$ifdef x86_64}        rexwritten:=false;{$endif x86_64}        { Force word push/pop for registers }        if (opsize=S_W) and ((codes[0]=#4) or (codes[0]=#6) or            ((codes[0]=#1) and ((codes[2]=#5) or (codes[2]=#7)))) then          begin            bytes[0]:=$66;            objdata.writebytes(bytes,1);          end;        repeat          c:=ord(codes^);          inc(codes);          case c of            0 :              break;            1,2,3 :              begin{$ifdef x86_64}                maybewriterex;{$endif x86_64}                objdata.writebytes(codes^,c);                inc(codes,c);              end;            4,6 :              begin                case oper[0]^.reg of                  NR_CS:                    bytes[0]:=$e;                  NR_NO,                  NR_DS:                    bytes[0]:=$1e;                  NR_ES:                    bytes[0]:=$6;                  NR_SS:                    bytes[0]:=$16;                  else                    internalerror(777004);                end;                if c=4 then                  inc(bytes[0]);                objdata.writebytes(bytes,1);              end;            5,7 :              begin                case oper[0]^.reg of                  NR_FS:                    bytes[0]:=$a0;                  NR_GS:                    bytes[0]:=$a8;                  else                    internalerror(777005);                end;                if c=5 then                  inc(bytes[0]);                objdata.writebytes(bytes,1);              end;            8,9,10 :              begin{$ifdef x86_64}                maybewriterex;{$endif x86_64}                bytes[0]:=ord(codes^)+regval(oper[c-8]^.reg);                inc(codes);                objdata.writebytes(bytes,1);              end;            11 :              begin                bytes[0]:=ord(codes^)+condval[condition];                inc(codes);                objdata.writebytes(bytes,1);              end;            12,13,14 :              begin                getvalsym(c-12);                if (currval<-128) or (currval>127) then                 Message2(asmw_e_value_exceeds_bounds,'signed byte',tostr(currval));                if assigned(currsym) then                  objdata_writereloc(currval,1,currsym,currabsreloc)                else                  objdata.writebytes(currval,1);              end;            16,17,18 :              begin                getvalsym(c-16);                if (currval<-256) or (currval>255) then                 Message2(asmw_e_value_exceeds_bounds,'byte',tostr(currval));                if assigned(currsym) then                 objdata_writereloc(currval,1,currsym,currabsreloc)                else                 objdata.writebytes(currval,1);              end;            20,21,22 :              begin                getvalsym(c-20);                if (currval<0) or (currval>255) then                 Message2(asmw_e_value_exceeds_bounds,'unsigned byte',tostr(currval));                if assigned(currsym) then                 objdata_writereloc(currval,1,currsym,currabsreloc)                else                 objdata.writebytes(currval,1);              end;            24,25,26 :     // 030..032              begin                getvalsym(c-24);                if (currval<-65536) or (currval>65535) then                 Message2(asmw_e_value_exceeds_bounds,'word',tostr(currval));                if assigned(currsym) then                 objdata_writereloc(currval,2,currsym,currabsreloc)                else                 objdata.writebytes(currval,2);              end;            28,29,30 :     // 034..036              { !!! These are intended (and used in opcode table) to select depending                    on address size, *not* operand size. Works by coincidence only. }              begin                getvalsym(c-28);                if opsize=S_Q then                  begin                    if assigned(currsym) then                     objdata_writereloc(currval,8,currsym,currabsreloc)                    else                     objdata.writebytes(currval,8);                  end                else                  begin                    if assigned(currsym) then                      objdata_writereloc(currval,4,currsym,currabsreloc32)                    else                      objdata.writebytes(currval,4);                  end              end;            32,33,34 :    // 040..042              begin                getvalsym(c-32);                if assigned(currsym) then                 objdata_writereloc(currval,4,currsym,currabsreloc32)                else                 objdata.writebytes(currval,4);              end;            36,37,38 :   // 044..046 - select between word/dword/qword depending on              begin      // address size (we support only default address sizes).                getvalsym(c-36);{$ifdef x86_64}                if assigned(currsym) then                  objdata_writereloc(currval,8,currsym,currabsreloc)                else                  objdata.writebytes(currval,8);{$else x86_64}                if assigned(currsym) then                  objdata_writereloc(currval,4,currsym,currabsreloc32)                else                  objdata.writebytes(currval,4);{$endif x86_64}              end;            40,41,42 :   // 050..052 - byte relative operand              begin                getvalsym(c-40);                data:=currval-insend;                if assigned(currsym) then                 inc(data,currsym.address);                if (data>127) or (data<-128) then                 Message1(asmw_e_short_jmp_out_of_range,tostr(data));                objdata.writebytes(data,1);              end;            44,45,46:   // 054..056 - qword immediate operand              begin                getvalsym(c-44);                if assigned(currsym) then                  objdata_writereloc(currval,8,currsym,currabsreloc)                else                  objdata.writebytes(currval,8);              end;            52,53,54 :  // 064..066 - select between 16/32 address mode, but we support only 32              begin                getvalsym(c-52);                if assigned(currsym) then                 objdata_writereloc(currval,4,currsym,currrelreloc)                else                 objdata_writereloc(currval-insend,4,nil,currabsreloc32)              end;            56,57,58 :  // 070..072 - long relative operand              begin                getvalsym(c-56);                if assigned(currsym) then                 objdata_writereloc(currval,4,currsym,currrelreloc)                else                 objdata_writereloc(currval-insend,4,nil,currabsreloc32)              end;            172,173,174 :  // 0254..0256 - dword implicitly sign-extended to 64-bit (x86_64 only)              begin                getvalsym(c-172);{$ifdef x86_64}                { for i386 as aint type is longint the                  following test is useless }                if (currval<low(longint)) or (currval>high(longint)) then                  Message2(asmw_e_value_exceeds_bounds,'signed dword',tostr(currval));{$endif x86_64}                if assigned(currsym) then                  objdata_writereloc(currval,4,currsym,currabsreloc32)                else                  objdata.writebytes(currval,4);              end;            200 :   { fixed 16-bit addr }{$ifndef x86_64}              begin                bytes[0]:=$67;                objdata.writebytes(bytes,1);              end;{$else x86_64}              { every insentry having code 0310 must be marked with NOX86_64 }              InternalError(2011051302);{$endif}            201 :   { fixed 32-bit addr }{$ifdef x86_64}              begin                bytes[0]:=$67;                objdata.writebytes(bytes,1);              end{$endif x86_64}               ;            208,209,210 :              begin                case oper[c-208]^.ot and OT_SIZE_MASK of                  OT_BITS16 :                    begin                      bytes[0]:=$66;                      objdata.writebytes(bytes,1);                    end;{$ifndef x86_64}                  OT_BITS64 :                      Message(asmw_e_64bit_not_supported);{$endif x86_64}                end;              end;            211,            213 : {no action needed};            212, 241 :              begin                bytes[0]:=$66;                objdata.writebytes(bytes,1);              end;            214 :              begin{$ifndef x86_64}                Message(asmw_e_64bit_not_supported);{$endif x86_64}              end;            219 :              begin                bytes[0]:=$f3;                objdata.writebytes(bytes,1);              end;            220 :              begin                bytes[0]:=$f2;                objdata.writebytes(bytes,1);              end;            221:              ;            202,            215,            217,218 :              begin                { these are dissambler hints or 32 bit prefixes which                  are not needed }              end;            31,            48,49,50 :              begin                InternalError(777006);              end            else              begin                { rex should be written at this point }{$ifdef x86_64}                if (rex<>0) and not(rexwritten) then                  internalerror(200603191);{$endif x86_64}                if (c>=64) and (c<=151) then  // 0100..0227                 begin                   if (c<127) then            // 0177                    begin                      if (oper[c and 7]^.typ=top_reg) then                        rfield:=regval(oper[c and 7]^.reg)                      else                        rfield:=regval(oper[c and 7]^.ref^.base);                    end                   else                    rfield:=c and 7;                   opidx:=(c shr 3) and 7;                   if not process_ea(oper[opidx]^,ea_data,rfield) then                     Message(asmw_e_invalid_effective_address);                   pb:=@bytes[0];                   pb^:=ea_data.modrm;                   inc(pb);                   if ea_data.sib_present then                    begin                      pb^:=ea_data.sib;                      inc(pb);                    end;                   s:=pb-@bytes[0];                   objdata.writebytes(bytes,s);                   case ea_data.bytes of                     0 : ;                     1 :                       begin                         if (oper[opidx]^.ot and OT_MEMORY)=OT_MEMORY then                           begin                             currsym:=objdata.symbolref(oper[opidx]^.ref^.symbol);{$ifdef i386}                             if (oper[opidx]^.ref^.refaddr=addr_pic) and                                (tf_pic_uses_got in target_info.flags) then                               currabsreloc:=RELOC_GOT32                             else{$endif i386}{$ifdef x86_64}                             if oper[opidx]^.ref^.refaddr=addr_pic then                               currabsreloc:=RELOC_GOTPCREL                             else{$endif x86_64}                               currabsreloc:=RELOC_ABSOLUTE;                             objdata_writereloc(oper[opidx]^.ref^.offset,1,currsym,currabsreloc);                           end                         else                          begin                            bytes[0]:=oper[opidx]^.ref^.offset;                            objdata.writebytes(bytes,1);                          end;                         inc(s);                       end;                     2,4 :                       begin                         currsym:=objdata.symbolref(oper[opidx]^.ref^.symbol);                         currval:=oper[opidx]^.ref^.offset;{$ifdef x86_64}                         if oper[opidx]^.ref^.refaddr=addr_pic then                           currabsreloc:=RELOC_GOTPCREL                         else                           if oper[opidx]^.ref^.base=NR_RIP then                             begin                               currabsreloc:=RELOC_RELATIVE;                               { Adjust reloc value by number of bytes following the displacement,                                 but not if displacement is specified by literal constant }                               if Assigned(currsym) then                                 Dec(currval,InsEnd-objdata.CurrObjSec.Size-ea_data.bytes);                             end                           else{$endif x86_64}{$ifdef i386}                         if (oper[opidx]^.ref^.refaddr=addr_pic) and                            (tf_pic_uses_got in target_info.flags) then                           currabsreloc:=RELOC_GOT32                         else{$endif i386}                             currabsreloc:=RELOC_ABSOLUTE32;                           if (currabsreloc=RELOC_ABSOLUTE32) and                            (Assigned(oper[opidx]^.ref^.relsymbol)) then                           begin                             relsym:=objdata.symbolref(oper[opidx]^.ref^.relsymbol);                             currabsreloc:=RELOC_PIC_PAIR;                             currval:=relsym.offset;                           end;                         objdata_writereloc(currval,ea_data.bytes,currsym,currabsreloc);                         inc(s,ea_data.bytes);                       end;                   end;                 end                else                 InternalError(777007);              end;          end;        until false;      end;    function taicpu.is_same_reg_move(regtype: Tregistertype):boolean;      begin        result:=(((opcode=A_MOV) or (opcode=A_XCHG)) and                 (regtype = R_INTREGISTER) and                 (ops=2) and                 (oper[0]^.typ=top_reg) and                 (oper[1]^.typ=top_reg) and                 (oper[0]^.reg=oper[1]^.reg)                ) or                (((opcode=A_MOVSS) or (opcode=A_MOVSD) or (opcode=A_MOVQ) or                  (opcode=A_MOVAPS) or (OPCODE=A_MOVAPD)) and                 (regtype = R_MMREGISTER) and                 (ops=2) and                 (oper[0]^.typ=top_reg) and                 (oper[1]^.typ=top_reg) and                 (oper[0]^.reg=oper[1]^.reg)                );      end;    procedure build_spilling_operation_type_table;      var        opcode : tasmop;        i      : integer;      begin        new(operation_type_table);        fillchar(operation_type_table^,sizeof(toperation_type_table),byte(operand_read));        for opcode:=low(tasmop) to high(tasmop) do          begin            for i:=1 to MaxInsChanges do              begin                case InsProp[opcode].Ch[i] of                  Ch_Rop1 :                    operation_type_table^[opcode,0]:=operand_read;                  Ch_Wop1 :                    operation_type_table^[opcode,0]:=operand_write;                  Ch_RWop1,                  Ch_Mop1 :                    operation_type_table^[opcode,0]:=operand_readwrite;                  Ch_Rop2 :                    operation_type_table^[opcode,1]:=operand_read;                  Ch_Wop2 :                    operation_type_table^[opcode,1]:=operand_write;                  Ch_RWop2,                  Ch_Mop2 :                    operation_type_table^[opcode,1]:=operand_readwrite;                  Ch_Rop3 :                    operation_type_table^[opcode,2]:=operand_read;                  Ch_Wop3 :                    operation_type_table^[opcode,2]:=operand_write;                  Ch_RWop3,                  Ch_Mop3 :                    operation_type_table^[opcode,2]:=operand_readwrite;                end;              end;          end;        { Special cases that can't be decoded from the InsChanges flags }        operation_type_table^[A_IMUL,1]:=operand_readwrite;      end;    function taicpu.spilling_get_operation_type(opnr: longint): topertype;      begin        { the information in the instruction table is made for the string copy          operation MOVSD so hack here (FK)        }        if (opcode=A_MOVSD) and (ops=2) then          begin            case opnr of              0:                result:=operand_read;              1:                result:=operand_write;              else                internalerror(200506055);            end          end        else          result:=operation_type_table^[opcode,opnr];      end;    function spilling_create_load(const ref:treference;r:tregister):Taicpu;      begin        case getregtype(r) of          R_INTREGISTER :            { we don't need special code here for 32 bit loads on x86_64, since              those will automatically zero-extend the upper 32 bits. }            result:=taicpu.op_ref_reg(A_MOV,reg2opsize(r),ref,r);          R_MMREGISTER :            case getsubreg(r) of              R_SUBMMD:                result:=taicpu.op_ref_reg(A_MOVSD,reg2opsize(r),ref,r);              R_SUBMMS:                result:=taicpu.op_ref_reg(A_MOVSS,reg2opsize(r),ref,r);              R_SUBMMWHOLE:                result:=taicpu.op_ref_reg(A_MOVQ,S_NO,ref,r);              else                internalerror(200506043);            end;          else            internalerror(200401041);        end;      end;    function spilling_create_store(r:tregister; const ref:treference):Taicpu;      var        size: topsize;      begin        case getregtype(r) of          R_INTREGISTER :            begin              size:=reg2opsize(r);{$ifdef x86_64}              { even if it's a 32 bit reg, we still have to spill 64 bits                because we often perform 64 bit operations on them }              if (size=S_L) then                begin                  size:=S_Q;                  r:=newreg(getregtype(r),getsupreg(r),R_SUBWHOLE);                end;{$endif x86_64}              result:=taicpu.op_reg_ref(A_MOV,size,r,ref);            end;          R_MMREGISTER :            case getsubreg(r) of              R_SUBMMD:                result:=taicpu.op_reg_ref(A_MOVSD,reg2opsize(r),r,ref);              R_SUBMMS:                result:=taicpu.op_reg_ref(A_MOVSS,reg2opsize(r),r,ref);              R_SUBMMWHOLE:                result:=taicpu.op_reg_ref(A_MOVQ,S_NO,r,ref);              else                internalerror(200506042);            end;          else            internalerror(200401041);        end;      end;{*****************************************************************************                              Instruction table*****************************************************************************}    procedure BuildInsTabCache;      var        i : longint;      begin        new(instabcache);        FillChar(instabcache^,sizeof(tinstabcache),$ff);        i:=0;        while (i<InsTabEntries) do         begin           if InsTabCache^[InsTab[i].OPcode]=-1 then            InsTabCache^[InsTab[i].OPcode]:=i;           inc(i);         end;      end;    procedure InitAsm;      begin        build_spilling_operation_type_table;        if not assigned(instabcache) then          BuildInsTabCache;      end;    procedure DoneAsm;      begin        if assigned(operation_type_table) then          begin            dispose(operation_type_table);            operation_type_table:=nil;          end;        if assigned(instabcache) then          begin            dispose(instabcache);            instabcache:=nil;          end;      end;begin  cai_align:=tai_align;  cai_cpu:=taicpu;end.
 |