| 1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152215321542155215621572158215921602161216221632164216521662167216821692170217121722173217421752176217721782179218021812182218321842185218621872188218921902191219221932194219521962197219821992200220122022203220422052206220722082209221022112212221322142215221622172218221922202221222222232224222522262227222822292230223122322233223422352236223722382239224022412242224322442245224622472248224922502251225222532254225522562257225822592260226122622263226422652266226722682269227022712272227322742275227622772278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311 | {    Copyright (c) 1998-2002 by Florian Klaempfl    This unit implements the code generator for the i8086    This program is free software; you can redistribute it and/or modify    it under the terms of the GNU General Public License as published by    the Free Software Foundation; either version 2 of the License, or    (at your option) any later version.    This program is distributed in the hope that it will be useful,    but WITHOUT ANY WARRANTY; without even the implied warranty of    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the    GNU General Public License for more details.    You should have received a copy of the GNU General Public License    along with this program; if not, write to the Free Software    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. ****************************************************************************}unit cgcpu;{$i fpcdefs.inc}  interface    uses       globtype,       cgbase,cgobj,cg64f32,cgx86,       aasmbase,aasmtai,aasmdata,aasmcpu,       cpubase,parabase,cgutils,       symconst,symdef       ;    type      { tcg8086 }      tcg8086 = class(tcgx86)        procedure init_register_allocators;override;        procedure do_register_allocation(list:TAsmList;headertai:tai);override;        function getintregister(list:TAsmList;size:Tcgsize):Tregister;override;        procedure a_call_name(list : TAsmList;const s : string; weak: boolean);override;        procedure a_call_name_far(list : TAsmList;const s : string; weak: boolean);        procedure a_call_name_static(list : TAsmList;const s : string);override;        procedure a_call_name_static_far(list : TAsmList;const s : string);        procedure a_call_reg(list : TAsmList;reg : tregister);override;        procedure a_call_reg_far(list : TAsmList;reg : tregister);        procedure a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; reg: TRegister); override;        procedure a_op_const_ref(list : TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference); override;        procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;        procedure a_op_ref_reg(list : TAsmList; Op: TOpCG; size: TCGSize; const ref: TReference; reg: TRegister); override;        procedure a_op_reg_ref(list : TAsmList; Op: TOpCG; size: TCGSize;reg: TRegister; const ref: TReference); override;        procedure push_const(list:TAsmList;size:tcgsize;a:tcgint);        { passing parameter using push instead of mov }        procedure a_load_reg_cgpara(list : TAsmList;size : tcgsize;r : tregister;const cgpara : tcgpara);override;        procedure a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const cgpara : tcgpara);override;        procedure a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const cgpara : tcgpara);override;        procedure a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const cgpara : tcgpara);override;        { move instructions }        procedure a_load_const_reg(list : TAsmList; tosize: tcgsize; a : tcgint;reg : tregister);override;        procedure a_load_const_ref(list : TAsmList; tosize: tcgsize; a : tcgint;const ref : treference);override;        procedure a_load_reg_ref(list : TAsmList;fromsize,tosize: tcgsize; reg : tregister;const ref : treference);override;        procedure a_load_ref_reg(list : TAsmList;fromsize,tosize: tcgsize;const ref : treference;reg : tregister);override;        procedure a_load_reg_reg(list : TAsmList;fromsize,tosize: tcgsize;reg1,reg2 : tregister);override;        {  comparison operations }        procedure a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;reg : tregister;          l : tasmlabel);override;        procedure a_cmp_const_ref_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : tcgint;const ref : treference;          l : tasmlabel);override;        procedure a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel); override;        procedure a_cmp_ref_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;const ref: treference; reg : tregister; l : tasmlabel); override;        procedure a_cmp_reg_ref_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg : tregister; const ref: treference; l : tasmlabel); override;        procedure gen_cmp32_jmp1(list: TAsmList; cmp_op: topcmp; l_skip, l_target: TAsmLabel);        procedure gen_cmp32_jmp2(list: TAsmList; cmp_op: topcmp; l_skip, l_target: TAsmLabel);        procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: tresflags; reg: TRegister);override;        procedure g_flags2ref(list: TAsmList; size: TCgSize; const f: tresflags; const ref: TReference);override;        procedure g_stackpointer_alloc(list : TAsmList;localsize: longint);override;        procedure g_proc_exit(list : TAsmList;parasize:longint;nostackframe:boolean);override;        procedure g_copyvaluepara_openarray(list : TAsmList;const ref:treference;const lenloc:tlocation;elesize:tcgint;destreg:tregister);        procedure g_releasevaluepara_openarray(list : TAsmList;const l:tlocation);        procedure g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);override;        procedure get_32bit_ops(op: TOpCG; out op1,op2: TAsmOp);        procedure add_move_instruction(instr:Taicpu);override;     end;      tcg64f8086 = class(tcg64f32)        procedure a_op64_ref_reg(list : TAsmList;op:TOpCG;size : tcgsize;const ref : treference;reg : tregister64);override;        procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;        procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;        procedure a_op64_const_ref(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;const ref : treference);override;      private        procedure get_64bit_ops(op:TOpCG;var op1,op2:TAsmOp);      end;    procedure create_codegen;  implementation    uses       globals,verbose,systems,cutils,       paramgr,procinfo,fmodule,       rgcpu,rgx86,cpuinfo,       symtype,symsym,symcpu,       tgobj,       hlcgobj;    function use_push(const cgpara:tcgpara):boolean;      begin        result:=(not paramanager.use_fixed_stack) and                assigned(cgpara.location) and                (cgpara.location^.loc=LOC_REFERENCE) and                (cgpara.location^.reference.index=NR_STACK_POINTER_REG);      end;    procedure tcg8086.init_register_allocators;      begin        inherited init_register_allocators;        if cs_create_pic in current_settings.moduleswitches then          rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,[RS_AX,RS_DX,RS_CX,RS_SI,RS_DI],first_int_imreg,[RS_BP])        else          if (cs_useebp in current_settings.optimizerswitches) and assigned(current_procinfo) and (current_procinfo.framepointer<>NR_BP) then            rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,[RS_AX,RS_DX,RS_CX,RS_BX,RS_SI,RS_DI,RS_BP],first_int_imreg,[])          else            rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,[RS_AX,RS_DX,RS_CX,RS_BX,RS_SI,RS_DI],first_int_imreg,[RS_BP]);        rg[R_MMXREGISTER]:=trgcpu.create(R_MMXREGISTER,R_SUBNONE,[RS_XMM0,RS_XMM1,RS_XMM2,RS_XMM3,RS_XMM4,RS_XMM5,RS_XMM6,RS_XMM7],first_mm_imreg,[]);        rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBWHOLE,[RS_XMM0,RS_XMM1,RS_XMM2,RS_XMM3,RS_XMM4,RS_XMM5,RS_XMM6,RS_XMM7],first_mm_imreg,[]);        rgfpu:=Trgx86fpu.create;      end;    procedure tcg8086.do_register_allocation(list:TAsmList;headertai:tai);      begin        if (pi_needs_got in current_procinfo.flags) then          begin            if getsupreg(current_procinfo.got) < first_int_imreg then              include(rg[R_INTREGISTER].used_in_proc,getsupreg(current_procinfo.got));          end;        inherited do_register_allocation(list,headertai);      end;    function tcg8086.getintregister(list: TAsmList; size: Tcgsize): Tregister;      begin        case size of          OS_8, OS_S8,          OS_16, OS_S16:            Result := inherited getintregister(list, size);          OS_32, OS_S32:            begin              Result:=inherited getintregister(list, OS_16);              { ensure that the high register can be retrieved by                GetNextReg              }              if inherited getintregister(list, OS_16)<>GetNextReg(Result) then                internalerror(2013030202);            end;          else            internalerror(2013030201);        end;      end;    procedure tcg8086.a_call_name(list: TAsmList; const s: string; weak: boolean);      begin        if current_settings.x86memorymodel in x86_far_code_models then          a_call_name_far(list,s,weak)        else          a_call_name_near(list,s,weak);      end;    procedure tcg8086.a_call_name_far(list: TAsmList; const s: string;      weak: boolean);      var        sym : tasmsymbol;      begin        if not(weak) then          sym:=current_asmdata.RefAsmSymbol(s)        else          sym:=current_asmdata.WeakRefAsmSymbol(s);        list.concat(taicpu.op_sym(A_CALL,S_FAR,sym));      end;    procedure tcg8086.a_call_name_static(list: TAsmList; const s: string);      begin        if current_settings.x86memorymodel in x86_far_code_models then          a_call_name_static_far(list,s)        else          a_call_name_static_near(list,s);      end;    procedure tcg8086.a_call_name_static_far(list: TAsmList; const s: string);      var        sym : tasmsymbol;      begin        sym:=current_asmdata.RefAsmSymbol(s);        list.concat(taicpu.op_sym(A_CALL,S_FAR,sym));      end;    procedure tcg8086.a_call_reg(list: TAsmList; reg: tregister);      begin        if current_settings.x86memorymodel in x86_far_code_models then          a_call_reg_far(list,reg)        else          a_call_reg_near(list,reg);      end;    procedure tcg8086.a_call_reg_far(list: TAsmList; reg: tregister);      var        href: treference;      begin        { unfortunately, x86 doesn't have a 'call far reg:reg' instruction, so }        { we have to use a temp }        tg.gettemp(list,4,2,tt_normal,href);        { HACK!!! at this point all registers are allocated, due to the fact that          in the pascal calling convention, all registers are caller saved. This          causes the register allocator to fail on the next move instruction, so we          temporarily deallocate 2 registers.          TODO: figure out a better way to do this. }        cg.ungetcpuregister(list,NR_BX);        cg.ungetcpuregister(list,NR_SI);        a_load_reg_ref(list,OS_32,OS_32,reg,href);        cg.getcpuregister(list,NR_BX);        cg.getcpuregister(list,NR_SI);        href.segment:=NR_NO;        list.concat(taicpu.op_ref(A_CALL,S_FAR,href));        tg.ungettemp(list,href);      end;    procedure tcg8086.a_op_const_reg(list: TAsmList; Op: TOpCG; size: TCGSize;      a: tcgint; reg: TRegister);      var        tmpreg: tregister;        op1, op2: TAsmOp;        ax_subreg: tregister;        hl_loop_start: tasmlabel;        ai: taicpu;        use_loop: Boolean;        i: Integer;      begin        optimize_op_const(size, op, a);        check_register_size(size,reg);        if size in [OS_64, OS_S64] then          internalerror(2013030904);        if size in [OS_32, OS_S32] then          begin            case op of              OP_NONE:                begin                  { Opcode is optimized away }                end;              OP_MOVE:                begin                  { Optimized, replaced with a simple load }                  a_load_const_reg(list,size,a,reg);                end;              OP_ADD, OP_SUB:                begin                  get_32bit_ops(op, op1, op2);                  { Optimization when the low 16-bits of the constant are 0 }                  if aint(a and $FFFF) = 0 then                    begin                      { use a_op_const_reg to allow the use of inc/dec }                      a_op_const_reg(list,op,OS_16,aint(a shr 16),GetNextReg(reg));                    end                  else                    begin                      list.concat(taicpu.op_const_reg(op1,S_W,aint(a and $FFFF),reg));                      list.concat(taicpu.op_const_reg(op2,S_W,aint(a shr 16),GetNextReg(reg)));                    end;                end;              OP_AND, OP_OR, OP_XOR:                begin                  { low word operation }                  if aint(a and $FFFF) = aint(0) then                    begin                      case op of                        OP_AND:                          a_load_const_reg(list,OS_16,aint(0),reg);                        OP_OR,OP_XOR:                          {do nothing};                        else                          InternalError(2013100701);                      end;                    end                  else if aint(a and $FFFF) = aint($FFFF) then                    begin                      case op of                        OP_AND:                          {do nothing};                        OP_OR:                          a_load_const_reg(list,OS_16,aint($FFFF),reg);                        OP_XOR:                          list.concat(taicpu.op_reg(A_NOT,S_W,reg));                        else                          InternalError(2013100701);                      end;                    end                  else                    a_op_const_reg(list,op,OS_16,aint(a and $FFFF),reg);                  { high word operation }                  if aint(a shr 16) = aint(0) then                    begin                      case op of                        OP_AND:                          a_load_const_reg(list,OS_16,aint(0),GetNextReg(reg));                        OP_OR,OP_XOR:                          {do nothing};                        else                          InternalError(2013100701);                      end;                    end                  else if aint(a shr 16) = aint($FFFF) then                    begin                      case op of                        OP_AND:                          {do nothing};                        OP_OR:                          a_load_const_reg(list,OS_16,aint($FFFF),GetNextReg(reg));                        OP_XOR:                          list.concat(taicpu.op_reg(A_NOT,S_W,GetNextReg(reg)));                        else                          InternalError(2013100701);                      end;                    end                  else                    a_op_const_reg(list,op,OS_16,aint(a shr 16),GetNextReg(reg));                end;              OP_SHR,OP_SHL,OP_SAR:                begin                  a:=a and 31;                  { for shl with const >= 16, we can just move the low register                    to the high reg, then zero the low register, then do the                    remaining part of the shift (by const-16) in 16 bit on the                    high register. the same thing applies to shr with low and high                    reversed. sar is exactly like shr, except that instead of                    zeroing the high register, we sar it by 15. }                  if a>=16 then                    case op of                      OP_SHR:                        begin                          a_load_reg_reg(list,OS_16,OS_16,GetNextReg(reg),reg);                          a_load_const_reg(list,OS_16,0,GetNextReg(reg));                          a_op_const_reg(list,OP_SHR,OS_16,a-16,reg);                        end;                      OP_SHL:                        begin                          a_load_reg_reg(list,OS_16,OS_16,reg,GetNextReg(reg));                          a_load_const_reg(list,OS_16,0,reg);                          a_op_const_reg(list,OP_SHL,OS_16,a-16,GetNextReg(reg));                        end;                      OP_SAR:                        begin                          if a=31 then                            begin                              a_op_const_reg(list,OP_SAR,OS_16,15,GetNextReg(reg));                              a_load_reg_reg(list,OS_16,OS_16,GetNextReg(reg),reg);                            end                          else                            begin                              a_load_reg_reg(list,OS_16,OS_16,GetNextReg(reg),reg);                              a_op_const_reg(list,OP_SAR,OS_16,15,GetNextReg(reg));                              a_op_const_reg(list,OP_SAR,OS_16,a-16,reg);                            end;                        end;                      else                        internalerror(2013060201);                    end                  else if a<>0 then                    begin                      use_loop:=a>2;                      if use_loop then                        begin                          getcpuregister(list,NR_CX);                          a_load_const_reg(list,OS_16,a,NR_CX);                          current_asmdata.getjumplabel(hl_loop_start);                          a_label(list,hl_loop_start);                          case op of                            OP_SHR:                              begin                                list.concat(taicpu.op_const_reg(A_SHR,S_W,1,GetNextReg(reg)));                                list.concat(taicpu.op_const_reg(A_RCR,S_W,1,reg));                              end;                            OP_SAR:                              begin                                list.concat(taicpu.op_const_reg(A_SAR,S_W,1,GetNextReg(reg)));                                list.concat(taicpu.op_const_reg(A_RCR,S_W,1,reg));                              end;                            OP_SHL:                              begin                                list.concat(taicpu.op_const_reg(A_SHL,S_W,1,reg));                                list.concat(taicpu.op_const_reg(A_RCL,S_W,1,GetNextReg(reg)));                              end;                            else                              internalerror(2013030903);                          end;                          ai:=Taicpu.Op_Sym(A_LOOP,S_W,hl_loop_start);                          ai.is_jmp:=true;                          list.concat(ai);                          ungetcpuregister(list,NR_CX);                        end                      else                        begin                          for i:=1 to a do                            begin                              case op of                                OP_SHR:                                  begin                                    list.concat(taicpu.op_const_reg(A_SHR,S_W,1,GetNextReg(reg)));                                    list.concat(taicpu.op_const_reg(A_RCR,S_W,1,reg));                                  end;                                OP_SAR:                                  begin                                    list.concat(taicpu.op_const_reg(A_SAR,S_W,1,GetNextReg(reg)));                                    list.concat(taicpu.op_const_reg(A_RCR,S_W,1,reg));                                  end;                                OP_SHL:                                  begin                                    list.concat(taicpu.op_const_reg(A_SHL,S_W,1,reg));                                    list.concat(taicpu.op_const_reg(A_RCL,S_W,1,GetNextReg(reg)));                                  end;                                else                                  internalerror(2013030903);                              end;                            end;                        end;                    end;                end;              else                begin                  tmpreg:=getintregister(list,size);                  a_load_const_reg(list,size,a,tmpreg);                  a_op_reg_reg(list,op,size,tmpreg,reg);                end;            end;          end        else          begin            { size <= 16-bit }            { 8086 doesn't support 'imul reg,const', so we handle it here }            if (current_settings.cputype<cpu_186) and (op in [OP_MUL,OP_IMUL]) then              begin                if op = OP_IMUL then                  begin                    if size in [OS_16,OS_S16] then                      ax_subreg := NR_AX                    else                      if size in [OS_8,OS_S8] then                        ax_subreg := NR_AL                      else                        internalerror(2013050102);                    getcpuregister(list,NR_AX);                    a_load_const_reg(list,size,a,ax_subreg);                    if size in [OS_16,OS_S16] then                      getcpuregister(list,NR_DX);                    { prefer MUL over IMUL when overflow checking is off, }                    { because it's faster on the 8086 & 8088              }                    if not (cs_check_overflow in current_settings.localswitches) then                      list.concat(taicpu.op_reg(A_MUL,TCgSize2OpSize[size],reg))                    else                      list.concat(taicpu.op_reg(A_IMUL,TCgSize2OpSize[size],reg));                    if size in [OS_16,OS_S16] then                      ungetcpuregister(list,NR_DX);                    a_load_reg_reg(list,size,size,ax_subreg,reg);                    ungetcpuregister(list,NR_AX);                    exit;                  end                else                  { OP_MUL should be handled specifically in the code        }                  { generator because of the silly register usage restraints }                  internalerror(200109225);              end            else              inherited a_op_const_reg(list, Op, size, a, reg);          end;      end;    procedure tcg8086.a_op_const_ref(list: TAsmList; Op: TOpCG; size: TCGSize; a: tcgint; const ref: TReference);      var        tmpref: treference;        op1,op2: TAsmOp;      begin        optimize_op_const(size, op, a);        tmpref:=ref;        make_simple_ref(list,tmpref);        if size in [OS_64, OS_S64] then          internalerror(2013050801);        if size in [OS_32, OS_S32] then          begin            case Op of              OP_NONE :                begin                  { Opcode is optimized away }                end;              OP_MOVE :                begin                  { Optimized, replaced with a simple load }                  a_load_const_ref(list,size,a,ref);                end;              OP_ADD, OP_SUB:                begin                  get_32bit_ops(op, op1, op2);                  { Optimization when the low 16-bits of the constant are 0 }                  if aint(a and $FFFF) = 0 then                    begin                      inc(tmpref.offset, 2);                      { use a_op_const_ref to allow the use of inc/dec }                      a_op_const_ref(list,op,OS_16,aint(a shr 16),tmpref);                    end                  else                    begin                      list.concat(taicpu.op_const_ref(op1,S_W,aint(a and $FFFF),tmpref));                      inc(tmpref.offset, 2);                      list.concat(taicpu.op_const_ref(op2,S_W,aint(a shr 16),tmpref));                    end;                end;              OP_AND, OP_OR, OP_XOR:                begin                  { low word operation }                  if aint(a and $FFFF) = aint(0) then                    begin                      case op of                        OP_AND:                          a_load_const_ref(list,OS_16,aint(0),ref);                        OP_OR,OP_XOR:                          {do nothing};                        else                          InternalError(2013100701);                      end;                    end                  else if aint(a and $FFFF) = aint($FFFF) then                    begin                      case op of                        OP_AND:                          {do nothing};                        OP_OR:                          a_load_const_ref(list,OS_16,aint($FFFF),tmpref);                        OP_XOR:                          list.concat(taicpu.op_ref(A_NOT,S_W,tmpref));                        else                          InternalError(2013100701);                      end;                    end                  else                    a_op_const_ref(list,op,OS_16,aint(a and $FFFF),tmpref);                  { high word operation }                  inc(tmpref.offset, 2);                  if aint(a shr 16) = aint(0) then                    begin                      case op of                        OP_AND:                          a_load_const_ref(list,OS_16,aint(0),tmpref);                        OP_OR,OP_XOR:                          {do nothing};                        else                          InternalError(2013100701);                      end;                    end                  else if aint(a shr 16) = aint($FFFF) then                    begin                      case op of                        OP_AND:                          {do nothing};                        OP_OR:                          a_load_const_ref(list,OS_16,aint($FFFF),tmpref);                        OP_XOR:                          list.concat(taicpu.op_ref(A_NOT,S_W,tmpref));                        else                          InternalError(2013100701);                      end;                    end                  else                    a_op_const_ref(list,op,OS_16,aint(a shr 16),tmpref);                end;              else                internalerror(2013050802);            end;          end        else          inherited a_op_const_ref(list,Op,size,a,tmpref);      end;    procedure tcg8086.a_op_reg_reg(list: TAsmList; Op: TOpCG; size: TCGSize;      src, dst: TRegister);      var        op1, op2: TAsmOp;        hl_skip, hl_loop_start: TAsmLabel;        ai: taicpu;      begin        check_register_size(size,src);        check_register_size(size,dst);        if size in [OS_64, OS_S64] then          internalerror(2013030902);        if size in [OS_32, OS_S32] then          begin            case op of              OP_NEG:                begin                  if src<>dst then                    a_load_reg_reg(list,size,size,src,dst);                  list.concat(taicpu.op_reg(A_NOT, S_W, GetNextReg(dst)));                  list.concat(taicpu.op_reg(A_NEG, S_W, dst));                  list.concat(taicpu.op_const_reg(A_SBB, S_W,-1, GetNextReg(dst)));                end;              OP_NOT:                begin                  if src<>dst then                    a_load_reg_reg(list,size,size,src,dst);                  list.concat(taicpu.op_reg(A_NOT, S_W, dst));                  list.concat(taicpu.op_reg(A_NOT, S_W, GetNextReg(dst)));                end;              OP_ADD,OP_SUB,OP_XOR,OP_OR,OP_AND:                begin                  get_32bit_ops(op, op1, op2);                  list.concat(taicpu.op_reg_reg(op1, S_W, src, dst));                  list.concat(taicpu.op_reg_reg(op2, S_W, GetNextReg(src), GetNextReg(dst)));                end;              OP_SHR,OP_SHL,OP_SAR:                begin                  getcpuregister(list,NR_CX);                  a_load_reg_reg(list,size,OS_16,src,NR_CX);                  list.concat(taicpu.op_const_reg(A_AND,S_W,$1f,NR_CX));                  current_asmdata.getjumplabel(hl_skip);                  ai:=Taicpu.Op_Sym(A_Jcc,S_NO,hl_skip);                  ai.SetCondition(C_Z);                  ai.is_jmp:=true;                  list.concat(ai);                  current_asmdata.getjumplabel(hl_loop_start);                  a_label(list,hl_loop_start);                  case op of                    OP_SHR:                      begin                        list.concat(taicpu.op_const_reg(A_SHR,S_W,1,GetNextReg(dst)));                        list.concat(taicpu.op_const_reg(A_RCR,S_W,1,dst));                      end;                    OP_SAR:                      begin                        list.concat(taicpu.op_const_reg(A_SAR,S_W,1,GetNextReg(dst)));                        list.concat(taicpu.op_const_reg(A_RCR,S_W,1,dst));                      end;                    OP_SHL:                      begin                        list.concat(taicpu.op_const_reg(A_SHL,S_W,1,dst));                        list.concat(taicpu.op_const_reg(A_RCL,S_W,1,GetNextReg(dst)));                      end;                    else                      internalerror(2013030903);                  end;                  ai:=Taicpu.Op_Sym(A_LOOP,S_W,hl_loop_start);                  ai.is_jmp:=true;                  list.concat(ai);                  a_label(list,hl_skip);                  ungetcpuregister(list,NR_CX);                end;              else                internalerror(2013030901);            end;          end        else          inherited a_op_reg_reg(list, Op, size, src, dst);      end;    procedure tcg8086.a_op_ref_reg(list: TAsmList; Op: TOpCG; size: TCGSize; const ref: TReference; reg: TRegister);      var        tmpref  : treference;        op1, op2: TAsmOp;      begin        tmpref:=ref;        make_simple_ref(list,tmpref);        check_register_size(size,reg);        if size in [OS_64, OS_S64] then          internalerror(2013030902);        if size in [OS_32, OS_S32] then          begin            case op of              OP_ADD,OP_SUB,OP_XOR,OP_OR,OP_AND:                begin                  get_32bit_ops(op, op1, op2);                  list.concat(taicpu.op_ref_reg(op1, S_W, tmpref, reg));                  inc(tmpref.offset, 2);                  list.concat(taicpu.op_ref_reg(op2, S_W, tmpref, GetNextReg(reg)));                end;              else                internalerror(2013050701);            end;          end        else          inherited a_op_ref_reg(list,Op,size,tmpref,reg);      end;    procedure tcg8086.a_op_reg_ref(list: TAsmList; Op: TOpCG; size: TCGSize; reg: TRegister; const ref: TReference);      var        tmpref: treference;        op1,op2: TAsmOp;      begin        tmpref:=ref;        make_simple_ref(list,tmpref);        check_register_size(size,reg);        if size in [OS_64, OS_S64] then          internalerror(2013050803);        if size in [OS_32, OS_S32] then          begin            case op of              OP_NEG:                begin                  if reg<>NR_NO then                    internalerror(200109237);                  inc(tmpref.offset, 2);                  list.concat(taicpu.op_ref(A_NOT, S_W, tmpref));                  dec(tmpref.offset, 2);                  list.concat(taicpu.op_ref(A_NEG, S_W, tmpref));                  inc(tmpref.offset, 2);                  list.concat(taicpu.op_const_ref(A_SBB, S_W,-1, tmpref));                end;              OP_NOT:                begin                  if reg<>NR_NO then                    internalerror(200109237);                  list.concat(taicpu.op_ref(A_NOT, S_W, tmpref));                  inc(tmpref.offset, 2);                  list.concat(taicpu.op_ref(A_NOT, S_W, tmpref));                end;              OP_IMUL:                begin                  { this one needs a load/imul/store, which is the default }                  inherited a_op_ref_reg(list,op,size,tmpref,reg);                end;              OP_MUL,OP_DIV,OP_IDIV:                { special stuff, needs separate handling inside code }                { generator                                          }                internalerror(200109238);              OP_ADD,OP_SUB,OP_XOR,OP_OR,OP_AND:                begin                  get_32bit_ops(op, op1, op2);                  list.concat(taicpu.op_reg_ref(op1, S_W, reg, tmpref));                  inc(tmpref.offset, 2);                  list.concat(taicpu.op_reg_ref(op2, S_W, GetNextReg(reg), tmpref));                end;              else                internalerror(2013050804);            end;          end        else          inherited a_op_reg_ref(list,Op,size,reg,tmpref);      end;    procedure tcg8086.push_const(list: TAsmList; size: tcgsize; a: tcgint);      var        tmpreg: TRegister;      begin        if not (size in [OS_16,OS_S16]) then          internalerror(2013043001);        if current_settings.cputype < cpu_186 then          begin            tmpreg:=getintregister(list,size);            a_load_const_reg(list,size,a,tmpreg);            list.concat(taicpu.op_reg(A_PUSH,S_W,tmpreg));          end        else          list.concat(taicpu.op_const(A_PUSH,TCGSize2OpSize[size],a));      end;    procedure tcg8086.a_load_reg_cgpara(list : TAsmList;size : tcgsize;r : tregister;const cgpara : tcgpara);      procedure load_para_loc(r : TRegister;paraloc : PCGParaLocation);        var          ref : treference;        begin          paramanager.allocparaloc(list,paraloc);          case paraloc^.loc of             LOC_REGISTER,LOC_CREGISTER:               a_load_reg_reg(list,paraloc^.size,paraloc^.size,r,paraloc^.register);             LOC_REFERENCE,LOC_CREFERENCE:               begin                  reference_reset_base(ref,paraloc^.reference.index,paraloc^.reference.offset,2);                  a_load_reg_ref(list,paraloc^.size,paraloc^.size,r,ref);               end;             else               internalerror(2002071004);          end;        end;      var        pushsize,pushsize2 : tcgsize;      begin        check_register_size(size,r);        if use_push(cgpara) then          begin            if tcgsize2size[cgpara.Size] > 2 then              begin                if tcgsize2size[cgpara.Size] <> 4 then                  internalerror(2013031101);                if cgpara.location^.Next = nil then                  begin                    if tcgsize2size[cgpara.location^.size] <> 4 then                      internalerror(2013031101);                  end                else                  begin                    if tcgsize2size[cgpara.location^.size] <> 2 then                      internalerror(2013031101);                    if tcgsize2size[cgpara.location^.Next^.size] <> 2 then                      internalerror(2013031101);                    if cgpara.location^.Next^.Next <> nil then                      internalerror(2013031101);                  end;                if tcgsize2size[cgpara.size]>cgpara.alignment then                  pushsize:=cgpara.size                else                  pushsize:=int_cgsize(cgpara.alignment);                pushsize2 := int_cgsize(tcgsize2size[pushsize] - 2);                list.concat(taicpu.op_reg(A_PUSH,TCgsize2opsize[pushsize2],makeregsize(list,GetNextReg(r),pushsize2)));                list.concat(taicpu.op_reg(A_PUSH,S_W,makeregsize(list,r,OS_16)));              end            else              begin                cgpara.check_simple_location;                if tcgsize2size[cgpara.location^.size]>cgpara.alignment then                  pushsize:=cgpara.location^.size                else                  pushsize:=int_cgsize(cgpara.alignment);                list.concat(taicpu.op_reg(A_PUSH,TCgsize2opsize[pushsize],makeregsize(list,r,pushsize)));              end;          end        else          begin            if tcgsize2size[cgpara.Size]=4 then              begin                if (cgpara.location^.Next=nil) or                  (tcgsize2size[cgpara.location^.size]<>2) or                  (tcgsize2size[cgpara.location^.Next^.size]<>2) or                  (cgpara.location^.Next^.Next<>nil) or                  (cgpara.location^.shiftval<>0) then                  internalerror(2013031102);                load_para_loc(r,cgpara.Location);                load_para_loc(GetNextReg(r),cgpara.Location^.Next);              end            else              inherited a_load_reg_cgpara(list,size,r,cgpara);          end;      end;    procedure tcg8086.a_load_const_cgpara(list : TAsmList;size : tcgsize;a : tcgint;const cgpara : tcgpara);      var        pushsize : tcgsize;      begin        if use_push(cgpara) then          begin            if tcgsize2size[cgpara.Size] > 2 then              begin                if tcgsize2size[cgpara.Size] <> 4 then                  internalerror(2013031101);                if cgpara.location^.Next = nil then                  begin                    if tcgsize2size[cgpara.location^.size] <> 4 then                      internalerror(2013031101);                  end                else                  begin                    if tcgsize2size[cgpara.location^.size] <> 2 then                      internalerror(2013031101);                    if tcgsize2size[cgpara.location^.Next^.size] <> 2 then                      internalerror(2013031101);                    if cgpara.location^.Next^.Next <> nil then                      internalerror(2013031101);                  end;                if (cgpara.alignment <> 4) and (cgpara.alignment <> 2) then                  internalerror(2013031101);                push_const(list,OS_16,a shr 16);                push_const(list,OS_16,a and $FFFF);              end            else              begin                cgpara.check_simple_location;                if tcgsize2size[cgpara.location^.size]>cgpara.alignment then                  pushsize:=cgpara.location^.size                else                  pushsize:=int_cgsize(cgpara.alignment);                push_const(list,pushsize,a);              end;          end        else          inherited a_load_const_cgpara(list,size,a,cgpara);      end;    procedure tcg8086.a_load_ref_cgpara(list : TAsmList;size : tcgsize;const r : treference;const cgpara : tcgpara);        procedure pushdata(paraloc:pcgparalocation;ofs:tcgint);        var          pushsize : tcgsize;          opsize : topsize;          tmpreg   : tregister;          href,tmpref: treference;        begin          if not assigned(paraloc) then            exit;          if (paraloc^.loc<>LOC_REFERENCE) or             (paraloc^.reference.index<>NR_STACK_POINTER_REG) or             (tcgsize2size[paraloc^.size]>4) then            internalerror(200501162);          { Pushes are needed in reverse order, add the size of the            current location to the offset where to load from. This            prevents wrong calculations for the last location when            the size is not a power of 2 }          if assigned(paraloc^.next) then            pushdata(paraloc^.next,ofs+tcgsize2size[paraloc^.size]);          { Push the data starting at ofs }          href:=r;          inc(href.offset,ofs);          if tcgsize2size[paraloc^.size]>cgpara.alignment then            pushsize:=paraloc^.size          else            pushsize:=int_cgsize(cgpara.alignment);          opsize:=TCgsize2opsize[pushsize];          { for go32v2 we obtain OS_F32,            but pushs is not valid, we need pushl }          if opsize=S_FS then            opsize:=S_W;          if tcgsize2size[paraloc^.size]<cgpara.alignment then            begin              tmpreg:=getintregister(list,pushsize);              a_load_ref_reg(list,paraloc^.size,pushsize,href,tmpreg);              list.concat(taicpu.op_reg(A_PUSH,opsize,tmpreg));            end          else            begin              make_simple_ref(list,href);              if tcgsize2size[pushsize] > 2 then                begin                  tmpref := href;                  Inc(tmpref.offset, 2);                  list.concat(taicpu.op_ref(A_PUSH,TCgsize2opsize[int_cgsize(tcgsize2size[pushsize]-2)],tmpref));                end;              list.concat(taicpu.op_ref(A_PUSH,opsize,href));            end;        end;      var        len : tcgint;        href : treference;      begin        { cgpara.size=OS_NO requires a copy on the stack }        if use_push(cgpara) then          begin            { Record copy? }            if (cgpara.size in [OS_NO,OS_F64]) or (size=OS_NO) then              begin                cgpara.check_simple_location;                len:=align(cgpara.intsize,cgpara.alignment);                g_stackpointer_alloc(list,len);                reference_reset_base(href,NR_STACK_POINTER_REG,0,4);                g_concatcopy(list,r,href,len);              end            else              begin                if tcgsize2size[cgpara.size]<>tcgsize2size[size] then                  internalerror(200501161);                { We need to push the data in reverse order,                  therefor we use a recursive algorithm }                pushdata(cgpara.location,0);              end          end        else          inherited a_load_ref_cgpara(list,size,r,cgpara);      end;    procedure tcg8086.a_loadaddr_ref_cgpara(list : TAsmList;const r : treference;const cgpara : tcgpara);      var        tmpreg : tregister;        tmpref : treference;      begin        with r do          begin            if use_push(cgpara) then              begin                if tcgsize2size[cgpara.Size] > 2 then                  begin                    if tcgsize2size[cgpara.Size] <> 4 then                      internalerror(2014032401);                    if cgpara.location^.Next = nil then                      begin                        if tcgsize2size[cgpara.location^.size] <> 4 then                          internalerror(2014032401);                      end                    else                      begin                        if tcgsize2size[cgpara.location^.size] <> 2 then                          internalerror(2014032401);                        if tcgsize2size[cgpara.location^.Next^.size] <> 2 then                          internalerror(2014032401);                        if cgpara.location^.Next^.Next <> nil then                          internalerror(2014032401);                      end;                    if cgpara.alignment > 4 then                      internalerror(2014032401);                    if segment<>NR_NO then                      begin                        list.concat(Taicpu.op_reg(A_PUSH,S_W,segment));                        tmpref:=r;                        tmpref.segment:=NR_NO;                        tmpreg:=getaddressregister(list);                        a_loadaddr_ref_reg(list,tmpref,tmpreg);                        list.concat(taicpu.op_reg(A_PUSH,S_W,tmpreg));                      end                    else                      begin                        if (base=NR_NO) and (index=NR_NO) then                          begin                            if assigned(symbol) then                              begin                                tmpref:=r;                                tmpref.refaddr:=addr_seg;                                tmpref.offset:=0;                                if current_settings.cputype < cpu_186 then                                  begin                                    tmpreg:=getaddressregister(list);                                    a_load_ref_reg(list,OS_16,OS_16,tmpref,tmpreg);                                    list.concat(taicpu.op_reg(A_PUSH,S_W,tmpreg));                                  end                                else                                  list.concat(Taicpu.Op_ref(A_PUSH,S_W,tmpref));                                if current_settings.cputype < cpu_186 then                                  begin                                    tmpreg:=getaddressregister(list);                                    a_loadaddr_ref_reg(list,r,tmpreg);                                    list.concat(taicpu.op_reg(A_PUSH,S_W,tmpreg));                                  end                                else                                  list.concat(Taicpu.Op_sym_ofs(A_PUSH,S_W,symbol,offset));                              end                            else                              internalerror(2014032402);                          end                        else if assigned(symbol) then                          begin                            reference_reset_symbol(tmpref,r.symbol,0,0);                            tmpref.refaddr:=addr_seg;                            if current_settings.cputype < cpu_186 then                              begin                                tmpreg:=getaddressregister(list);                                a_load_ref_reg(list,OS_16,OS_16,tmpref,tmpreg);                                list.concat(taicpu.op_reg(A_PUSH,S_W,tmpreg));                              end                            else                              list.concat(Taicpu.Op_ref(A_PUSH,S_W,tmpref));                            tmpreg:=getaddressregister(list);                            a_loadaddr_ref_reg(list,r,tmpreg);                            list.concat(taicpu.op_reg(A_PUSH,S_W,tmpreg));                          end                        else if base=NR_BP then                          begin                            list.concat(Taicpu.op_reg(A_PUSH,S_W,NR_SS));                            tmpreg:=getaddressregister(list);                            a_loadaddr_ref_reg(list,r,tmpreg);                            list.concat(taicpu.op_reg(A_PUSH,S_W,tmpreg));                          end                        else                          internalerror(2014032403);                      end;                  end                else                  begin                    cgpara.check_simple_location;                    tmpref:=r;                    tmpref.segment:=NR_NO;                    with tmpref do                      begin                        if (base=NR_NO) and (index=NR_NO) then                          begin                            if assigned(symbol) then                              begin                                if current_settings.cputype < cpu_186 then                                  begin                                    tmpreg:=getaddressregister(list);                                    a_loadaddr_ref_reg(list,tmpref,tmpreg);                                    list.concat(taicpu.op_reg(A_PUSH,S_W,tmpreg));                                  end                                else                                  list.concat(Taicpu.Op_sym_ofs(A_PUSH,S_W,symbol,offset));                              end                            else                              push_const(list,OS_16,offset);                          end                        else if (base=NR_NO) and (index<>NR_NO) and                                (offset=0) and (scalefactor=0) and (symbol=nil) then                          list.concat(Taicpu.Op_reg(A_PUSH,S_W,index))                        else if (base<>NR_NO) and (index=NR_NO) and                                (offset=0) and (symbol=nil) then                          list.concat(Taicpu.Op_reg(A_PUSH,S_W,base))                        else                          begin                            tmpreg:=getaddressregister(list);                            a_loadaddr_ref_reg(list,tmpref,tmpreg);                            list.concat(taicpu.op_reg(A_PUSH,S_W,tmpreg));                          end;                      end;                end;              end            else              inherited a_loadaddr_ref_cgpara(list,r,cgpara);          end;      end;    procedure tcg8086.a_load_const_reg(list : TAsmList; tosize: tcgsize; a : tcgint;reg : tregister);    begin      check_register_size(tosize,reg);      if tosize in [OS_S32,OS_32] then        begin          list.concat(taicpu.op_const_reg(A_MOV,S_W,longint(a and $ffff),reg));          list.concat(taicpu.op_const_reg(A_MOV,S_W,longint(a shr 16),GetNextReg(reg)));        end      else        list.concat(taicpu.op_const_reg(A_MOV,TCGSize2OpSize[tosize],a,reg));    end;    procedure tcg8086.a_load_const_ref(list : TAsmList; tosize: tcgsize; a : tcgint;const ref : treference);      var        tmpref : treference;      begin        tmpref:=ref;        make_simple_ref(list,tmpref);        if tosize in [OS_S32,OS_32] then          begin            a_load_const_ref(list,OS_16,longint(a and $ffff),tmpref);            inc(tmpref.offset,2);            a_load_const_ref(list,OS_16,longint(a shr 16),tmpref);          end        else          list.concat(taicpu.op_const_ref(A_MOV,TCGSize2OpSize[tosize],a,tmpref));      end;    procedure tcg8086.a_load_reg_ref(list : TAsmList;fromsize,tosize: tcgsize; reg : tregister;const ref : treference);      var        tmpreg  : tregister;        tmpref  : treference;      begin        tmpref:=ref;        make_simple_ref(list,tmpref);        check_register_size(fromsize,reg);        case tosize of          OS_8,OS_S8:            if fromsize in [OS_8,OS_S8] then              list.concat(taicpu.op_reg_ref(A_MOV, S_B, reg, tmpref))            else              internalerror(2013030310);          OS_16,OS_S16:            case fromsize of              OS_8,OS_S8:                begin                  tmpreg:=getintregister(list,tosize);                  a_load_reg_reg(list,fromsize,tosize,reg,tmpreg);                  a_load_reg_ref(list,tosize,tosize,tmpreg,tmpref);                end;              OS_16,OS_S16:                begin                  list.concat(taicpu.op_reg_ref(A_MOV, S_W, reg, tmpref));                end;              else                internalerror(2013030312);            end;          OS_32,OS_S32:            case fromsize of              OS_8,OS_S8,OS_S16:                begin                  tmpreg:=getintregister(list,tosize);                  a_load_reg_reg(list,fromsize,tosize,reg,tmpreg);                  a_load_reg_ref(list,tosize,tosize,tmpreg,tmpref);                end;              OS_16:                begin                  list.concat(taicpu.op_reg_ref(A_MOV, S_W, reg, tmpref));                  inc(tmpref.offset, 2);                  list.concat(taicpu.op_const_ref(A_MOV, S_W, 0, tmpref));                end;              OS_32,OS_S32:                begin                  list.concat(taicpu.op_reg_ref(A_MOV, S_W, reg, tmpref));                  inc(tmpref.offset, 2);                  list.concat(taicpu.op_reg_ref(A_MOV, S_W, GetNextReg(reg), tmpref));                end;              else                internalerror(2013030313);            end;          else            internalerror(2013030311);        end;      end;    procedure tcg8086.a_load_ref_reg(list : TAsmList;fromsize,tosize: tcgsize;const ref : treference;reg : tregister);        procedure add_mov(instr: Taicpu);          begin            { Notify the register allocator that we have written a move instruction so              it can try to eliminate it. }            if (instr.oper[0]^.reg<>current_procinfo.framepointer) and (instr.oper[0]^.reg<>NR_STACK_POINTER_REG) then              add_move_instruction(instr);            list.concat(instr);          end;      var        tmpref  : treference;      begin        tmpref:=ref;        make_simple_ref(list,tmpref);        check_register_size(tosize,reg);        if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then          internalerror(2011021307);{        if tcgsize2size[tosize]<=tcgsize2size[fromsize] then          fromsize:=tosize;}        case tosize of          OS_8,OS_S8:            if fromsize in [OS_8,OS_S8] then              list.concat(taicpu.op_ref_reg(A_MOV, S_B, tmpref, reg))            else              internalerror(2013030210);          OS_16,OS_S16:            case fromsize of              OS_8:                begin                  reg := makeregsize(list, reg, OS_8);                  list.concat(taicpu.op_ref_reg(A_MOV, S_B, tmpref, reg));                  setsubreg(reg, R_SUBH);                  list.concat(taicpu.op_const_reg(A_MOV, S_B, 0, reg));                  makeregsize(list, reg, OS_16);                end;              OS_S8:                begin                  getcpuregister(list, NR_AX);                  list.concat(taicpu.op_ref_reg(A_MOV, S_B, tmpref, NR_AL));                  list.concat(taicpu.op_none(A_CBW));                  add_mov(taicpu.op_reg_reg(A_MOV, S_W, NR_AX, reg));                  ungetcpuregister(list, NR_AX);                end;              OS_16,OS_S16:                list.concat(taicpu.op_ref_reg(A_MOV, S_W, tmpref, reg));              else                internalerror(2013030212);            end;          OS_32,OS_S32:            case fromsize of              OS_8:                begin                  list.concat(taicpu.op_const_reg(A_MOV,S_W,0,GetNextReg(reg)));                  reg := makeregsize(list, reg, OS_8);                  list.concat(taicpu.op_ref_reg(A_MOV, S_B, tmpref, reg));                  setsubreg(reg, R_SUBH);                  list.concat(taicpu.op_const_reg(A_MOV, S_B, 0, reg));                  makeregsize(list, reg, OS_16);                end;              OS_S8:                begin                  getcpuregister(list, NR_AX);                  list.concat(taicpu.op_ref_reg(A_MOV, S_B, tmpref, NR_AL));                  getcpuregister(list, NR_DX);                  list.concat(taicpu.op_none(A_CBW));                  list.concat(taicpu.op_none(A_CWD));                  add_mov(taicpu.op_reg_reg(A_MOV, S_W, NR_AX, reg));                  ungetcpuregister(list, NR_AX);                  add_mov(taicpu.op_reg_reg(A_MOV, S_W, NR_DX, GetNextReg(reg)));                  ungetcpuregister(list, NR_DX);                end;              OS_16:                begin                  list.concat(taicpu.op_ref_reg(A_MOV, S_W, tmpref, reg));                  list.concat(taicpu.op_const_reg(A_MOV,S_W,0,GetNextReg(reg)));                end;              OS_S16:                begin                  getcpuregister(list, NR_AX);                  list.concat(taicpu.op_ref_reg(A_MOV, S_W, tmpref, NR_AX));                  getcpuregister(list, NR_DX);                  list.concat(taicpu.op_none(A_CWD));                  ungetcpuregister(list, NR_AX);                  add_mov(taicpu.op_reg_reg(A_MOV, S_W, NR_AX, reg));                  ungetcpuregister(list, NR_DX);                  add_mov(taicpu.op_reg_reg(A_MOV, S_W, NR_DX, GetNextReg(reg)));                end;              OS_32,OS_S32:                begin                  list.concat(taicpu.op_ref_reg(A_MOV, S_W, tmpref, reg));                  inc(tmpref.offset, 2);                  list.concat(taicpu.op_ref_reg(A_MOV, S_W, tmpref, GetNextReg(reg)));                end;              else                internalerror(2013030213);            end;          else            internalerror(2013030211);        end;      end;    procedure tcg8086.a_load_reg_reg(list : TAsmList;fromsize,tosize: tcgsize;reg1,reg2 : tregister);        procedure add_mov(instr: Taicpu);          begin            { Notify the register allocator that we have written a move instruction so              it can try to eliminate it. }            if (instr.oper[0]^.reg<>current_procinfo.framepointer) and (instr.oper[0]^.reg<>NR_STACK_POINTER_REG) then              add_move_instruction(instr);            list.concat(instr);          end;      begin        check_register_size(fromsize,reg1);        check_register_size(tosize,reg2);        if tcgsize2size[fromsize]>tcgsize2size[tosize] then          begin            if tosize in [OS_32, OS_S32] then              internalerror(2013031801);            reg1:=makeregsize(list,reg1,tosize);            fromsize:=tosize;          end;        if (reg1<>reg2) or (fromsize<>tosize) then          begin            case tosize of              OS_8,OS_S8:                if fromsize in [OS_8,OS_S8] then                  begin                    if reg1<>reg2 then                      add_mov(taicpu.op_reg_reg(A_MOV, S_B, reg1, reg2));                  end                else                  internalerror(2013030210);              OS_16,OS_S16:                case fromsize of                  OS_8:                    begin                      reg2 := makeregsize(list, reg2, OS_8);                      if reg1<>reg2 then                        add_mov(taicpu.op_reg_reg(A_MOV, S_B, reg1, reg2));                      setsubreg(reg2,R_SUBH);                      list.concat(taicpu.op_const_reg(A_MOV, S_B, 0, reg2));                      makeregsize(list, reg2, OS_16);                    end;                  OS_S8:                    begin                      getcpuregister(list, NR_AX);                      add_mov(taicpu.op_reg_reg(A_MOV, S_B, reg1, NR_AL));                      list.concat(taicpu.op_none(A_CBW));                      add_mov(taicpu.op_reg_reg(A_MOV, S_W, NR_AX, reg2));                      ungetcpuregister(list, NR_AX);                    end;                  OS_16,OS_S16:                    begin                      if reg1<>reg2 then                        add_mov(taicpu.op_reg_reg(A_MOV, S_W, reg1, reg2));                    end                  else                    internalerror(2013030212);                end;              OS_32,OS_S32:                case fromsize of                  OS_8:                    begin                      list.concat(taicpu.op_const_reg(A_MOV, S_W, 0, GetNextReg(reg2)));                      reg2 := makeregsize(list, reg2, OS_8);                      if reg1<>reg2 then                        add_mov(taicpu.op_reg_reg(A_MOV, S_B, reg1, reg2));                      setsubreg(reg2,R_SUBH);                      list.concat(taicpu.op_const_reg(A_MOV, S_B, 0, reg2));                      makeregsize(list, reg2, OS_16);                    end;                  OS_S8:                    begin                      getcpuregister(list, NR_AX);                      add_mov(taicpu.op_reg_reg(A_MOV, S_B, reg1, NR_AL));                      getcpuregister(list, NR_DX);                      list.concat(taicpu.op_none(A_CBW));                      list.concat(taicpu.op_none(A_CWD));                      add_mov(taicpu.op_reg_reg(A_MOV, S_W, NR_AX, reg2));                      ungetcpuregister(list, NR_AX);                      add_mov(taicpu.op_reg_reg(A_MOV, S_W, NR_DX, GetNextReg(reg2)));                      ungetcpuregister(list, NR_DX);                    end;                  OS_16:                    begin                      if reg1<>reg2 then                        add_mov(taicpu.op_reg_reg(A_MOV, S_W, reg1, reg2));                      list.concat(taicpu.op_const_reg(A_MOV,S_W,0,GetNextReg(reg2)));                    end;                  OS_S16:                    begin                      getcpuregister(list, NR_AX);                      add_mov(taicpu.op_reg_reg(A_MOV, S_W, reg1, NR_AX));                      getcpuregister(list, NR_DX);                      list.concat(taicpu.op_none(A_CWD));                      if reg1<>reg2 then                        add_mov(taicpu.op_reg_reg(A_MOV, S_W, NR_AX, reg2));                      ungetcpuregister(list, NR_AX);                      add_mov(taicpu.op_reg_reg(A_MOV, S_W, NR_DX, GetNextReg(reg2)));                      ungetcpuregister(list, NR_DX);                    end;                  OS_32,OS_S32:                    begin                      if reg1<>reg2 then                        begin                          add_mov(taicpu.op_reg_reg(A_MOV, S_W, reg1, reg2));                          add_mov(taicpu.op_reg_reg(A_MOV, S_W, GetNextReg(reg1), GetNextReg(reg2)));                        end;                    end;                  else                    internalerror(2013030213);                end;              else                internalerror(2013030211);            end;          end;      end;    procedure tcg8086.a_cmp_const_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; a: tcgint; reg: tregister; l: tasmlabel);      var        hl_skip: TAsmLabel;      begin        if size in [OS_32, OS_S32] then          begin            if (longint(a shr 16) = 0) then              list.concat(taicpu.op_reg_reg(A_TEST,S_W,GetNextReg(reg),GetNextReg(reg)))            else              list.concat(taicpu.op_const_reg(A_CMP,S_W,longint(a shr 16),GetNextReg(reg)));            current_asmdata.getjumplabel(hl_skip);            gen_cmp32_jmp1(list, cmp_op, hl_skip, l);            if (longint(a and $ffff) = 0) then              list.concat(taicpu.op_reg_reg(A_TEST,S_W,reg,reg))            else              list.concat(taicpu.op_const_reg(A_CMP,S_W,longint(a and $ffff),reg));            gen_cmp32_jmp2(list, cmp_op, hl_skip, l);            a_label(list,hl_skip);          end        else          inherited a_cmp_const_reg_label(list, size, cmp_op, a, reg, l);      end;    procedure tcg8086.a_cmp_const_ref_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; a: tcgint; const ref: treference; l: tasmlabel);      var        tmpref: treference;        hl_skip: TAsmLabel;      begin        if size in [OS_32, OS_S32] then          begin            tmpref:=ref;            make_simple_ref(list,tmpref);            inc(tmpref.offset,2);            list.concat(taicpu.op_const_ref(A_CMP,S_W,longint(a shr 16),tmpref));            current_asmdata.getjumplabel(hl_skip);            gen_cmp32_jmp1(list, cmp_op, hl_skip, l);            dec(tmpref.offset,2);            list.concat(taicpu.op_const_ref(A_CMP,S_W,longint(a and $ffff),tmpref));            gen_cmp32_jmp2(list, cmp_op, hl_skip, l);            a_label(list,hl_skip);          end        else          inherited a_cmp_const_ref_label(list, size, cmp_op, a, ref, l);      end;    procedure tcg8086.a_cmp_reg_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; reg1, reg2: tregister; l: tasmlabel);      var        hl_skip: TAsmLabel;      begin        if size in [OS_32, OS_S32] then          begin            check_register_size(size,reg1);            check_register_size(size,reg2);            list.concat(taicpu.op_reg_reg(A_CMP,S_W,GetNextReg(reg1),GetNextReg(reg2)));            current_asmdata.getjumplabel(hl_skip);            gen_cmp32_jmp1(list, cmp_op, hl_skip, l);            list.concat(taicpu.op_reg_reg(A_CMP,S_W,reg1,reg2));            gen_cmp32_jmp2(list, cmp_op, hl_skip, l);            a_label(list,hl_skip);          end        else          inherited a_cmp_reg_reg_label(list, size, cmp_op, reg1, reg2, l);      end;    procedure tcg8086.a_cmp_ref_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; const ref: treference; reg: tregister; l: tasmlabel);      var        tmpref: treference;        hl_skip: TAsmLabel;      begin        if size in [OS_32, OS_S32] then          begin            tmpref:=ref;            make_simple_ref(list,tmpref);            check_register_size(size,reg);            inc(tmpref.offset,2);            list.concat(taicpu.op_ref_reg(A_CMP,S_W,tmpref,GetNextReg(reg)));            current_asmdata.getjumplabel(hl_skip);            gen_cmp32_jmp1(list, cmp_op, hl_skip, l);            dec(tmpref.offset,2);            list.concat(taicpu.op_ref_reg(A_CMP,S_W,tmpref,reg));            gen_cmp32_jmp2(list, cmp_op, hl_skip, l);            a_label(list,hl_skip);          end        else          inherited a_cmp_ref_reg_label(list, size, cmp_op, ref, reg, l);      end;    procedure tcg8086.a_cmp_reg_ref_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; reg: tregister; const ref: treference; l: tasmlabel);      var        tmpref: treference;        hl_skip: TAsmLabel;      begin        if size in [OS_32, OS_S32] then          begin            tmpref:=ref;            make_simple_ref(list,tmpref);            check_register_size(size,reg);            inc(tmpref.offset,2);            list.concat(taicpu.op_reg_ref(A_CMP,S_W,GetNextReg(reg),tmpref));            current_asmdata.getjumplabel(hl_skip);            gen_cmp32_jmp1(list, cmp_op, hl_skip, l);            dec(tmpref.offset,2);            list.concat(taicpu.op_reg_ref(A_CMP,S_W,reg,tmpref));            gen_cmp32_jmp2(list, cmp_op, hl_skip, l);            a_label(list,hl_skip);          end        else          inherited a_cmp_reg_ref_label(list, size, cmp_op, reg, ref, l);      end;    procedure tcg8086.gen_cmp32_jmp1(list: TAsmList; cmp_op: topcmp; l_skip, l_target: TAsmLabel);      begin        case cmp_op of          OC_EQ:            a_jmp_cond(list, OC_NE, l_skip);          OC_NE:            a_jmp_cond(list, OC_NE, l_target);          OC_GT,OC_GTE:            begin              a_jmp_cond(list, OC_GT, l_target);              a_jmp_cond(list, OC_LT, l_skip);            end;          OC_LT,OC_LTE:            begin              a_jmp_cond(list, OC_LT, l_target);              a_jmp_cond(list, OC_GT, l_skip);            end;          OC_B,OC_BE:            begin              a_jmp_cond(list, OC_B, l_target);              a_jmp_cond(list, OC_A, l_skip);            end;          OC_A,OC_AE:            begin              a_jmp_cond(list, OC_A, l_target);              a_jmp_cond(list, OC_B, l_skip);            end;          else            internalerror(2014010305);        end;      end;    procedure tcg8086.gen_cmp32_jmp2(list: TAsmList; cmp_op: topcmp; l_skip, l_target: TAsmLabel);      begin        case cmp_op of          OC_EQ:            a_jmp_cond(list, OC_EQ, l_target);          OC_GT:            a_jmp_cond(list, OC_A, l_target);          OC_LT:            a_jmp_cond(list, OC_B, l_target);          OC_GTE:            a_jmp_cond(list, OC_AE, l_target);          OC_LTE:            a_jmp_cond(list, OC_BE, l_target);          OC_NE:            a_jmp_cond(list, OC_NE, l_target);          OC_BE:            a_jmp_cond(list, OC_BE, l_target);          OC_B:            a_jmp_cond(list, OC_B, l_target);          OC_AE:            a_jmp_cond(list, OC_AE, l_target);          OC_A:            a_jmp_cond(list, OC_A, l_target);          else            internalerror(2014010306);        end;      end;    procedure tcg8086.g_flags2reg(list: TAsmList; size: TCgSize; const f: tresflags; reg: TRegister);      var        ai : taicpu;        hreg16 : tregister;        hl_skip: TAsmLabel;        invf: TResFlags;        tmpsize: TCgSize;      begin        invf := f;        inverse_flags(invf);        case size of          OS_8,OS_S8:            begin              tmpsize:=OS_8;              list.concat(Taicpu.op_const_reg(A_MOV, S_B, 0, reg));            end;          OS_16,OS_S16,OS_32,OS_S32:            begin              tmpsize:=OS_16;              list.concat(Taicpu.op_const_reg(A_MOV, S_W, 0, reg));            end;          else            internalerror(2013123101);        end;        current_asmdata.getjumplabel(hl_skip);        { we can't just forward invf to a_jmp_flags for FA,FAE,FB and FBE, because          in the case of NaNs:           not(F_FA )<>F_FBE           not(F_FAE)<>F_FB           not(F_FB )<>F_FAE           not(F_FBE)<>F_FA        }        case f of          F_FA,F_FAE:            invf:=FPUFlags2Flags[invf];          F_FB,F_FBE:            begin              ai:=Taicpu.op_sym(A_Jcc,S_NO,hl_skip);              ai.SetCondition(C_P);              ai.is_jmp:=true;              list.concat(ai);              invf:=FPUFlags2Flags[invf];            end;        end;        a_jmp_flags(list,invf,hl_skip);        { 16-bit INC is shorter than 8-bit }        hreg16:=makeregsize(list,reg,OS_16);        list.concat(Taicpu.op_reg(A_INC, S_W, hreg16));        makeregsize(list,hreg16,tmpsize);        a_label(list,hl_skip);        a_load_reg_reg(list,tmpsize,size,reg,reg);      end;    procedure tcg8086.g_flags2ref(list: TAsmList; size: TCgSize; const f: tresflags; const ref: TReference);      var        tmpreg : tregister;        tmpregsize: TCgSize;        tmpref: treference;      begin        if size in [OS_8,OS_S8,OS_16,OS_S16] then          tmpregsize:=size        else          tmpregsize:=OS_16;        tmpreg:=getintregister(list,tmpregsize);        g_flags2reg(list,tmpregsize,f,tmpreg);        tmpref:=ref;        make_simple_ref(list,tmpref);        if size in [OS_64,OS_S64] then          begin            a_load_reg_ref(list,tmpregsize,OS_32,tmpreg,tmpref);            inc(tmpref.offset,4);            a_load_const_ref(list,OS_32,0,tmpref);          end        else          a_load_reg_ref(list,tmpregsize,size,tmpreg,tmpref);      end;    procedure tcg8086.g_stackpointer_alloc(list : TAsmList;localsize: longint);      begin        if localsize>0 then          list.concat(Taicpu.Op_const_reg(A_SUB,S_W,localsize,NR_STACK_POINTER_REG));      end;    procedure tcg8086.g_proc_exit(list : TAsmList;parasize:longint;nostackframe:boolean);      var        stacksize : longint;        ret_instr: TAsmOp;      begin        if is_proc_far(current_procinfo.procdef) then          ret_instr:=A_RETF        else          ret_instr:=A_RET;        { MMX needs to call EMMS }        if assigned(rg[R_MMXREGISTER]) and           (rg[R_MMXREGISTER].uses_registers) then          list.concat(Taicpu.op_none(A_EMMS,S_NO));        { remove stackframe }        if not nostackframe then          begin            if (current_procinfo.framepointer=NR_STACK_POINTER_REG) then              begin                stacksize:=current_procinfo.calc_stackframe_size;                if (target_info.stackalign>4) and                   ((stacksize <> 0) or                    (pi_do_call in current_procinfo.flags) or                    { can't detect if a call in this case -> use nostackframe }                    { if you (think you) know what you are doing              }                    (po_assembler in current_procinfo.procdef.procoptions)) then                  stacksize := align(stacksize+sizeof(aint),target_info.stackalign) - sizeof(aint);                if (stacksize<>0) then                  cg.a_op_const_reg(list,OP_ADD,OS_ADDR,stacksize,current_procinfo.framepointer);              end            else              generate_leave(list);            list.concat(tai_regalloc.dealloc(current_procinfo.framepointer,nil));          end;        { return from interrupt }        if po_interrupt in current_procinfo.procdef.procoptions then          begin            list.concat(Taicpu.Op_reg(A_POP,S_W,NR_ES));            list.concat(Taicpu.Op_reg(A_POP,S_W,NR_DS));            list.concat(Taicpu.Op_reg(A_POP,S_W,NR_DI));            list.concat(Taicpu.Op_reg(A_POP,S_W,NR_SI));            list.concat(Taicpu.Op_reg(A_POP,S_W,NR_DX));            list.concat(Taicpu.Op_reg(A_POP,S_W,NR_CX));            list.concat(Taicpu.Op_reg(A_POP,S_W,NR_BX));            list.concat(Taicpu.Op_reg(A_POP,S_W,NR_AX));            list.concat(Taicpu.Op_none(A_IRET,S_NO));          end        { Routines with the poclearstack flag set use only a ret }        else if (current_procinfo.procdef.proccalloption in clearstack_pocalls) and                (not paramanager.use_fixed_stack)  then         begin           { complex return values are removed from stack in C code PM }           { but not on win32 }           { and not for safecall with hidden exceptions, because the result }           { wich contains the exception is passed in EAX }           if (target_info.system <> system_i386_win32) and              not ((current_procinfo.procdef.proccalloption = pocall_safecall) and               (tf_safecall_exceptions in target_info.flags)) and              paramanager.ret_in_param(current_procinfo.procdef.returndef,                                       current_procinfo.procdef) then             list.concat(Taicpu.Op_const(ret_instr,S_W,sizeof(aint)))           else             list.concat(Taicpu.Op_none(ret_instr,S_NO));         end        { ... also routines with parasize=0 }        else if (parasize=0) then         list.concat(Taicpu.Op_none(ret_instr,S_NO))        else         begin           { parameters are limited to 65535 bytes because ret allows only imm16 }           if (parasize>65535) then             CGMessage(cg_e_parasize_too_big);           list.concat(Taicpu.Op_const(ret_instr,S_W,parasize));         end;      end;    procedure tcg8086.g_copyvaluepara_openarray(list : TAsmList;const ref:treference;const lenloc:tlocation;elesize:tcgint;destreg:tregister);      var        power  : longint;        opsize : topsize;        saved_ds: Boolean;      begin        { get stack space }        getcpuregister(list,NR_DI);        a_load_loc_reg(list,OS_INT,lenloc,NR_DI);        list.concat(Taicpu.op_reg(A_INC,S_W,NR_DI));        { Now DI contains (high+1). }        { special case handling for elesize=2:          set CX = (high+1) instead of CX = (high+1)*elesize.          This allows us to avoid the SHR later. }        if elesize=2 then          begin            { Now DI contains (high+1). Copy it to CX for later use. }            getcpuregister(list,NR_CX);            list.concat(Taicpu.op_reg_reg(A_MOV,S_W,NR_DI,NR_CX));          end;        { DI := DI * elesize }        if (elesize<>1) then         begin           if ispowerof2(elesize, power) then             a_op_const_reg(list,OP_SHL,OS_16,power,NR_DI)           else             a_op_const_reg(list,OP_IMUL,OS_16,elesize,NR_DI);         end;        if elesize<>2 then          begin            { Now DI contains (high+1)*elesize. Copy it to CX for later use. }            getcpuregister(list,NR_CX);            list.concat(Taicpu.op_reg_reg(A_MOV,S_W,NR_DI,NR_CX));          end;        { If we were probing pages, EDI=(size mod pagesize) and ESP is decremented          by (size div pagesize)*pagesize, otherwise EDI=size.          Either way, subtracting EDI from ESP will set ESP to desired final value. }        list.concat(Taicpu.op_reg_reg(A_SUB,S_W,NR_DI,NR_SP));        { align stack on 2 bytes }        list.concat(Taicpu.op_const_reg(A_AND,S_W,aint($fffe),NR_SP));        { load destination, don't use a_load_reg_reg, that will add a move instruction          that can confuse the reg allocator }        list.concat(Taicpu.Op_reg_reg(A_MOV,S_W,NR_SP,NR_DI));{$ifdef volatile_es}        list.concat(taicpu.op_reg(A_PUSH,S_W,NR_SS));        list.concat(taicpu.op_reg(A_POP,S_W,NR_ES));{$endif volatile_es}        { Allocate SI and load it with source }        getcpuregister(list,NR_SI);        if ((ref.segment=NR_NO) and (segment_regs_equal(NR_SS,NR_DS) or (ref.base<>NR_BP))) or           (is_segment_reg(ref.segment) and segment_regs_equal(ref.segment,NR_DS)) then          begin            hlcg.a_loadaddr_ref_reg(list,voidnearpointertype,voidnearpointertype,ref,NR_SI);            saved_ds:=false;          end        else          begin            hlcg.a_loadaddr_ref_reg(list,voidnearpointertype,voidnearpointertype,ref,NR_SI);            list.concat(taicpu.op_reg(A_PUSH,S_W,NR_DS));            saved_ds:=true;            if ref.segment<>NR_NO then              list.concat(taicpu.op_reg(A_PUSH,S_W,ref.segment))            else if ref.base=NR_BP then              list.concat(taicpu.op_reg(A_PUSH,S_W,NR_SS))            else              internalerror(2014040403);            list.concat(taicpu.op_reg(A_POP,S_W,NR_DS));          end;        { calculate size }        opsize:=S_B;        if elesize=2 then          begin            opsize:=S_W;            { CX is already number of words, so no need to SHL/SHR }          end        else if (elesize and 1)=0 then          begin            opsize:=S_W;            { CX is number of bytes, convert to words }            list.concat(Taicpu.op_const_reg(A_SHR,S_W,1,NR_CX))          end;        if ts_cld in current_settings.targetswitches then          list.concat(Taicpu.op_none(A_CLD,S_NO));        if (opsize=S_B) and not (cs_opt_size in current_settings.optimizerswitches) then          begin            { SHR CX,1 moves the lowest (odd/even) bit to the carry flag }            list.concat(Taicpu.op_const_reg(A_SHR,S_W,1,NR_CX));            list.concat(Taicpu.op_none(A_REP,S_NO));            list.concat(Taicpu.op_none(A_MOVSW,S_NO));            { ADC CX,CX will set CX to 1 if the number of bytes was odd }            list.concat(Taicpu.op_reg_reg(A_ADC,S_W,NR_CX,NR_CX));            list.concat(Taicpu.op_none(A_REP,S_NO));            list.concat(Taicpu.op_none(A_MOVSB,S_NO));          end        else          begin            list.concat(Taicpu.op_none(A_REP,S_NO));            case opsize of              S_B : list.concat(Taicpu.Op_none(A_MOVSB,S_NO));              S_W : list.concat(Taicpu.Op_none(A_MOVSW,S_NO));            end;          end;        ungetcpuregister(list,NR_DI);        ungetcpuregister(list,NR_CX);        ungetcpuregister(list,NR_SI);        if saved_ds then          list.concat(taicpu.op_reg(A_POP,S_W,NR_DS));        { patch the new address, but don't use a_load_reg_reg, that will add a move instruction          that can confuse the reg allocator }        list.concat(Taicpu.Op_reg_reg(A_MOV,S_W,NR_SP,destreg));        if current_settings.x86memorymodel in x86_far_data_models then          list.concat(Taicpu.Op_reg_reg(A_MOV,S_W,NR_SS,GetNextReg(destreg)));      end;    procedure tcg8086.g_releasevaluepara_openarray(list : TAsmList;const l:tlocation);      begin        { Nothing to release }      end;    procedure tcg8086.get_32bit_ops(op: TOpCG; out op1, op2: TAsmOp);      begin        case op of          OP_ADD :            begin              op1:=A_ADD;              op2:=A_ADC;            end;          OP_SUB :            begin              op1:=A_SUB;              op2:=A_SBB;            end;          OP_XOR :            begin              op1:=A_XOR;              op2:=A_XOR;            end;          OP_OR :            begin              op1:=A_OR;              op2:=A_OR;            end;          OP_AND :            begin              op1:=A_AND;              op2:=A_AND;            end;          else            internalerror(200203241);        end;      end;    procedure tcg8086.add_move_instruction(instr: Taicpu);      begin        { HACK: when regvars are on, don't notify the register allocator of any          direct moves to BX, so it doesn't try to coalesce them. Currently,          direct moves to BX are only used when returning an int64 value in          AX:BX:CX:DX. This hack fixes a common issue with functions, returning          int64, for example:        function RandomFrom(const AValues: array of Int64): Int64;          begin            result:=AValues[random(High(AValues)+1)];          end;    	push	bp    	mov	bp,sp; Var AValues located in register ireg20w; Var $highAVALUES located in register ireg21w; Var $result located in register ireg33w:ireg32w:ireg31w:ireg30w    	mov	ireg20w,word [bp+6]    	mov	ireg21w,word [bp+4]; [3] result:=AValues[random(High(AValues)+1)];    	mov	ireg22w,ireg21w    	inc	ireg22w    	mov	ax,ireg22w    	cwd    	mov	ireg23w,ax    	mov	ireg24w,dx    	push	ireg24w    	push	ireg23w    	call	SYSTEM_$$_RANDOM$LONGINT$$LONGINT    	mov	ireg25w,ax    	mov	ireg26w,dx    	mov	ireg27w,ireg25w    	mov	ireg28w,ireg27w    	mov	ireg29w,ireg28w    	mov	cl,3    	shl	ireg29w,cl; Var $result located in register ireg32w:ireg30w    	mov	ireg30w,word [ireg20w+ireg29w]    	mov	ireg31w,word [ireg20w+ireg29w+2]    	mov	ireg32w,word [ireg20w+ireg29w+4]  ; problematic section start    	mov	ireg33w,word [ireg20w+ireg29w+6]; [4] end;    	mov	bx,ireg32w  ; problematic section end    	mov	ax,ireg33w    	mov	dx,ireg30w    	mov	cx,ireg31w    	mov	sp,bp    	pop	bp    	ret	4        the problem arises, because the register allocator tries to coalesce          mov bx,ireg32w        however, in the references [ireg20w+ireg29w+const], due to the        constraints of i8086, ireg20w can only be BX (or BP, which isn't available        to the register allocator, because it's used as a base pointer) }        if (cs_opt_regvar in current_settings.optimizerswitches) and           (instr.opcode=A_MOV) and (instr.ops=2) and           (instr.oper[1]^.typ=top_reg) and (getsupreg(instr.oper[1]^.reg)=RS_BX) then          exit        else          inherited add_move_instruction(instr);      end;    procedure tcg8086.g_adjust_self_value(list:TAsmList;procdef: tprocdef;ioffset: tcgint);      var        hsym : tsym;        href : treference;        paraloc : Pcgparalocation;        return_address_size: Integer;      begin        if current_settings.x86memorymodel in x86_far_code_models then          return_address_size:=4        else          return_address_size:=2;        { calculate the parameter info for the procdef }        procdef.init_paraloc_info(callerside);        hsym:=tsym(procdef.parast.Find('self'));        if not(assigned(hsym) and               (hsym.typ=paravarsym)) then          internalerror(200305251);        paraloc:=tparavarsym(hsym).paraloc[callerside].location;        with paraloc^ do          begin            case loc of              LOC_REGISTER:                a_op_const_reg(list,OP_SUB,size,ioffset,register);              LOC_REFERENCE:                begin                  { offset in the wrapper needs to be adjusted for the stored                    return address }                  if (reference.index<>NR_BP) and (reference.index<>NR_BX) and (reference.index<>NR_DI)                    and (reference.index<>NR_SI) then                    begin                      list.concat(taicpu.op_reg(A_PUSH,S_W,NR_DI));                      list.concat(taicpu.op_reg_reg(A_MOV,S_W,reference.index,NR_DI));                      if reference.index=NR_SP then                        reference_reset_base(href,NR_DI,reference.offset+return_address_size+2,sizeof(pint))                      else                        reference_reset_base(href,NR_DI,reference.offset+return_address_size,sizeof(pint));                      href.segment:=NR_SS;                      a_op_const_ref(list,OP_SUB,size,ioffset,href);                      list.concat(taicpu.op_reg(A_POP,S_W,NR_DI));                    end                  else                    begin                      reference_reset_base(href,reference.index,reference.offset+return_address_size,sizeof(pint));                      href.segment:=NR_SS;                      a_op_const_ref(list,OP_SUB,size,ioffset,href);                    end;                end              else                internalerror(200309189);            end;            paraloc:=next;          end;      end;{ ************* 64bit operations ************ }    procedure tcg64f8086.get_64bit_ops(op:TOpCG;var op1,op2:TAsmOp);      begin        case op of          OP_ADD :            begin              op1:=A_ADD;              op2:=A_ADC;            end;          OP_SUB :            begin              op1:=A_SUB;              op2:=A_SBB;            end;          OP_XOR :            begin              op1:=A_XOR;              op2:=A_XOR;            end;          OP_OR :            begin              op1:=A_OR;              op2:=A_OR;            end;          OP_AND :            begin              op1:=A_AND;              op2:=A_AND;            end;          else            internalerror(200203241);        end;      end;    procedure tcg64f8086.a_op64_ref_reg(list : TAsmList;op:TOpCG;size : tcgsize;const ref : treference;reg : tregister64);      var        op1,op2 : TAsmOp;        tempref : treference;      begin        if not(op in [OP_NEG,OP_NOT]) then          begin            get_64bit_ops(op,op1,op2);            tempref:=ref;            tcgx86(cg).make_simple_ref(list,tempref);            list.concat(taicpu.op_ref_reg(op1,S_W,tempref,reg.reglo));            inc(tempref.offset,2);            list.concat(taicpu.op_ref_reg(op2,S_W,tempref,GetNextReg(reg.reglo)));            inc(tempref.offset,2);            list.concat(taicpu.op_ref_reg(op2,S_W,tempref,reg.reghi));            inc(tempref.offset,2);            list.concat(taicpu.op_ref_reg(op2,S_W,tempref,GetNextReg(reg.reghi)));          end        else          begin            a_load64_ref_reg(list,ref,reg);            a_op64_reg_reg(list,op,size,reg,reg);          end;      end;    procedure tcg64f8086.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);      var        op1,op2 : TAsmOp;      begin        case op of          OP_NEG :            begin              if (regsrc.reglo<>regdst.reglo) then                a_load64_reg_reg(list,regsrc,regdst);              cg.a_op_reg_reg(list,OP_NOT,OS_32,regdst.reghi,regdst.reghi);              cg.a_op_reg_reg(list,OP_NEG,OS_32,regdst.reglo,regdst.reglo);              { there's no OP_SBB, so do it directly }              list.concat(taicpu.op_const_reg(A_SBB,S_W,-1,regdst.reghi));              list.concat(taicpu.op_const_reg(A_SBB,S_W,-1,GetNextReg(regdst.reghi)));              exit;            end;          OP_NOT :            begin              if (regsrc.reglo<>regdst.reglo) then                a_load64_reg_reg(list,regsrc,regdst);              cg.a_op_reg_reg(list,OP_NOT,OS_32,regdst.reglo,regdst.reglo);              cg.a_op_reg_reg(list,OP_NOT,OS_32,regdst.reghi,regdst.reghi);              exit;            end;        end;        get_64bit_ops(op,op1,op2);        list.concat(taicpu.op_reg_reg(op1,S_W,regsrc.reglo,regdst.reglo));        list.concat(taicpu.op_reg_reg(op2,S_W,GetNextReg(regsrc.reglo),GetNextReg(regdst.reglo)));        list.concat(taicpu.op_reg_reg(op2,S_W,regsrc.reghi,regdst.reghi));        list.concat(taicpu.op_reg_reg(op2,S_W,GetNextReg(regsrc.reghi),GetNextReg(regdst.reghi)));      end;    procedure tcg64f8086.a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);      var        op1,op2 : TAsmOp;      begin        case op of          OP_AND,OP_OR,OP_XOR:            begin              cg.a_op_const_reg(list,op,OS_32,tcgint(lo(value)),reg.reglo);              cg.a_op_const_reg(list,op,OS_32,tcgint(hi(value)),reg.reghi);            end;          OP_ADD, OP_SUB:            begin              get_64bit_ops(op,op1,op2);              if (value and $ffffffffffff) = 0 then                begin                  { use a_op_const_reg to allow the use of inc/dec }                  cg.a_op_const_reg(list,op,OS_16,aint((value shr 48) and $ffff),GetNextReg(reg.reghi));                end              // can't use a_op_const_ref because this may use dec/inc              else if (value and $ffffffff) = 0 then                begin                  list.concat(taicpu.op_const_reg(op1,S_W,aint((value shr 32) and $ffff),reg.reghi));                  list.concat(taicpu.op_const_reg(op2,S_W,aint((value shr 48) and $ffff),GetNextReg(reg.reghi)));                end              else if (value and $ffff) = 0 then                begin                  list.concat(taicpu.op_const_reg(op1,S_W,aint((value shr 16) and $ffff),GetNextReg(reg.reglo)));                  list.concat(taicpu.op_const_reg(op2,S_W,aint((value shr 32) and $ffff),reg.reghi));                  list.concat(taicpu.op_const_reg(op2,S_W,aint((value shr 48) and $ffff),GetNextReg(reg.reghi)));                end              else                begin                  list.concat(taicpu.op_const_reg(op1,S_W,aint(value and $ffff),reg.reglo));                  list.concat(taicpu.op_const_reg(op2,S_W,aint((value shr 16) and $ffff),GetNextReg(reg.reglo)));                  list.concat(taicpu.op_const_reg(op2,S_W,aint((value shr 32) and $ffff),reg.reghi));                  list.concat(taicpu.op_const_reg(op2,S_W,aint((value shr 48) and $ffff),GetNextReg(reg.reghi)));                end;            end;          else            internalerror(200204021);        end;      end;    procedure tcg64f8086.a_op64_const_ref(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;const ref : treference);      var        op1,op2 : TAsmOp;        tempref : treference;      begin        tempref:=ref;        tcgx86(cg).make_simple_ref(list,tempref);        case op of          OP_AND,OP_OR,OP_XOR:            begin              cg.a_op_const_ref(list,op,OS_32,tcgint(lo(value)),tempref);              inc(tempref.offset,4);              cg.a_op_const_ref(list,op,OS_32,tcgint(hi(value)),tempref);            end;          OP_ADD, OP_SUB:            begin              get_64bit_ops(op,op1,op2);              if (value and $ffffffffffff) = 0 then                begin                  inc(tempref.offset,6);                  { use a_op_const_ref to allow the use of inc/dec }                  cg.a_op_const_ref(list,op,OS_16,aint((value shr 48) and $ffff),tempref);                end              // can't use a_op_const_ref because this may use dec/inc              else if (value and $ffffffff) = 0 then                begin                  inc(tempref.offset,4);                  list.concat(taicpu.op_const_ref(op1,S_W,aint((value shr 32) and $ffff),tempref));                  inc(tempref.offset,2);                  list.concat(taicpu.op_const_ref(op2,S_W,aint((value shr 48) and $ffff),tempref));                end              else if (value and $ffff) = 0 then                begin                  inc(tempref.offset,2);                  list.concat(taicpu.op_const_ref(op1,S_W,aint((value shr 16) and $ffff),tempref));                  inc(tempref.offset,2);                  list.concat(taicpu.op_const_ref(op2,S_W,aint((value shr 32) and $ffff),tempref));                  inc(tempref.offset,2);                  list.concat(taicpu.op_const_ref(op2,S_W,aint((value shr 48) and $ffff),tempref));                end              else                begin                  list.concat(taicpu.op_const_ref(op1,S_W,aint(value and $ffff),tempref));                  inc(tempref.offset,2);                  list.concat(taicpu.op_const_ref(op2,S_W,aint((value shr 16) and $ffff),tempref));                  inc(tempref.offset,2);                  list.concat(taicpu.op_const_ref(op2,S_W,aint((value shr 32) and $ffff),tempref));                  inc(tempref.offset,2);                  list.concat(taicpu.op_const_ref(op2,S_W,aint((value shr 48) and $ffff),tempref));                end;            end;          else            internalerror(200204022);        end;      end;    procedure create_codegen;      begin        cg := tcg8086.create;        cg64 := tcg64f8086.create;      end;end.
 |