{
    Copyright (c) 2014 by Jonas Maebe

    This unit implements the code generator for Xtensa

    This program is free software; you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation; either version 2 of the License, or
    (at your option) any later version.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with this program; if not, write to the Free Software
    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.

 ****************************************************************************}
unit cgcpu;

{$i fpcdefs.inc}

interface

    uses
       globtype,parabase,
       cgbase,cgutils,cgobj,
       aasmbase,aasmtai,aasmdata,aasmcpu,
       cpubase,cpuinfo,
       node,symconst,SymType,symdef,
       rgcpu,
       cg64f32;

    type
      { 32 bit code generator of this unit: derives from tcg and overrides the
        load, arithmetic, call/jump, compare and procedure entry/exit hooks
        declared below }
      tcgcpu=class(tcg)
      private
        { emits code so that ref ends up with symbol=nil, offset=0 and
          index=NR_NO, i.e. only a base register is left }
        procedure fixref(list : TAsmList; var ref : treference);
      public
        procedure init_register_allocators;override;
        procedure done_register_allocators;override;
       { move instructions }
        procedure a_load_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister);override;
        procedure a_load_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister;const ref: TReference);override;
        procedure a_load_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: TReference; reg: tregister);override;
        procedure a_load_const_reg(list: TAsmList; size: tcgsize; a: tcgint; reg: tregister);override;
        procedure a_loadaddr_ref_reg(list: TAsmList; const ref: TReference; r: tregister);override;
        { integer operations }
        procedure a_op_reg_reg(list: TAsmList; op: topcg; size: tcgsize; src, dst: tregister);override;
        procedure a_op_const_reg(list: TAsmList; op: topcg; size: tcgsize; a: tcgint; reg: tregister);override;
        procedure a_op_reg_reg_reg(list: TAsmList; op: topcg; size: tcgsize; src1, src2, dst: tregister);override;
        procedure a_op_const_reg_reg(list : TAsmList; op : TOpCg; size : tcgsize; a : tcgint; src,dst : tregister);override;
        { calls and jumps }
        procedure a_call_name(list:TAsmList;const s:string; weak: boolean);override;
        procedure a_call_reg(list:TAsmList;Reg:tregister);override;
        procedure a_jmp_name(list: TAsmList; const s: string);override;
        procedure a_jmp_flags(list: TAsmList; const f: TResFlags; l: tasmlabel);override;
        { procedure prologue and epilogue }
        procedure g_proc_entry(list: TAsmList; localsize: longint; nostackframe: boolean);override;
        procedure g_proc_exit(list: TAsmList; parasize: longint; nostackframe: boolean);override;
        { comparison operations }
        procedure a_cmp_const_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; a: tcgint; reg: tregister; l: tasmlabel); override;
        procedure a_cmp_reg_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; reg1, reg2: tregister; l: tasmlabel);override;
        procedure a_jmp_always(list: TAsmList; l: TAsmLabel);override;
        procedure a_bit_scan_reg_reg(list: TAsmList; reverse,not_zero: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister);override;
        procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: tresflags; reg: TRegister);override;
        procedure g_concatcopy(list : TAsmList; const source,dest : treference; len : tcgint);override;
        { floating point moves }
        procedure a_loadfpu_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister);override;
        procedure a_loadfpu_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister);override;
        procedure a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);override;
        procedure a_loadfpu_intreg_reg(list: TAsmList; fromsize, tosize: tcgsize; intreg, fpureg: tregister);override;
        procedure a_loadfpu_reg_intreg(list: TAsmList; fromsize, tosize: tcgsize; fpureg, intreg: tregister);override;
        { helpers that are not overrides of tcg methods }
        procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
        procedure g_overflowcheck(list: TAsmList; const Loc:tlocation; def:tdef);override;
        { returns a label that is used as the symbol of an L32R reference
          by the callers in this unit }
        function create_data_entry(symbol: TAsmSymbol; offset: asizeint): TAsmLabel;
      end;

      { 64 bit operations; derives from tcg64f32 and overrides its a_op64_* methods }
      tcg64fxtensa = class(tcg64f32)
        procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
        procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;
        procedure a_op64_const_reg(list :
TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
        procedure a_op64_reg_reg_reg(list : TAsmList; op : TOpCG;size : tcgsize; regsrc1,regsrc2,regdst : tregister64);override;
        { The declarations below are disabled. Every "//" comment has to stay on
          a physical line of its own: such a comment runs to the end of the line
          and would otherwise also comment out the "end;" of this class and all
          code following it. }
        //procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
        //procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
        //procedure a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
        //procedure a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
        //procedure a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);override;
        //procedure a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);override;
      end;

    procedure create_codegen;

    const
      { assembler opcode used for each topcg value (one entry per enumeration
        value, in declaration order); this table is indexed by
        tcgcpu.a_op_reg_reg_reg }
      TOpCG2AsmOp: array[topcg] of TAsmOp = (
        A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MULL,A_MULL,A_NEG,A_NONE,A_OR,A_SRA,A_SLL,A_SRL,A_SUB,A_XOR,A_NONE,A_NONE
      );
{
      );
      TOpCG2AsmOpReg: array[topcg] of TAsmOp = (
        A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NEG,A_MVN,A_ORR,A_ASRV,A_LSLV,A_LSRV,A_SUB,A_EOR,A_NONE,A_RORV
      );
      TOpCG2AsmOpImm: array[topcg] of TAsmOp = (
        A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NEG,A_MVN,A_ORR,A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR
      );
      TOpCmp2AsmCond: array[topcmp] of TAsmCond = (C_NONE,C_EQ,C_GT,
        C_LT,C_GE,C_LE,C_NE,C_LS,C_CC,C_CS,C_HI
      );
}

implementation

  uses
    globals,verbose,systems,cutils,
    paramgr,fmodule,
    symtable,symsym,
    tgobj,
    procinfo,cpupi;


  const
    { branch condition for each TOpCmp value (one entry per enumeration value) }
    TOpCmp2AsmCond: array[TOpCmp] of TAsmCond = (
      C_None,
      C_EQ,
C_None,
      C_LT,
      C_GE,
      C_None,
      C_NE,
      C_None,
      C_LTU,
      C_GEU,
      C_None
    );


    { Creates the register allocators for the integer (A), floating point (F)
      and special (B) register types. }
    procedure tcgcpu.init_register_allocators;
      begin
        inherited init_register_allocators;
        { for the call0 ABI, A8 and A15 are left out of the allocatable set }
        if target_info.abi = abi_xtensa_call0 then
          rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
              [RS_A2,RS_A3,RS_A4,RS_A5,RS_A6,RS_A7,{RS_A8,}RS_A9,
               RS_A10,RS_A11,RS_A12,RS_A13,RS_A14{,RS_A15}],first_int_imreg,[])
        else
          rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
              [RS_A2,RS_A3,RS_A4,RS_A5,RS_A6,RS_A7,RS_A8,RS_A9,
               RS_A10,RS_A11,RS_A12,RS_A13,RS_A14,RS_A15],first_int_imreg,[]);
        rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
            [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7,RS_F8,RS_F9,
             RS_F10,RS_F11,RS_F12,RS_F13,RS_F14,RS_F15],first_fpu_imreg,[]);
        rg[R_SPECIALREGISTER]:=trgcpu.create(R_SPECIALREGISTER,R_SUBNONE,
            [RS_B0,RS_B1,RS_B2,RS_B3,RS_B4,RS_B5,RS_B6,RS_B7,RS_B8,RS_B9,
             RS_B10,RS_B11,RS_B12,RS_B13,RS_B14,RS_B15],first_flag_imreg,[]);
      end;


    { Frees the three allocators created by init_register_allocators and
      then calls the inherited method. }
    procedure tcgcpu.done_register_allocators;
      begin
        rg[R_INTREGISTER].free;
        rg[R_FPUREGISTER].free;
        rg[R_SPECIALREGISTER].free;
        inherited done_register_allocators;
      end;


    { Emits code that copies reg1 into reg2, converting from fromsize to
      tosize. If the sizes differ, an extension sequence is emitted for the
      8 and 16 bit sizes; in all other cases a plain MOV is emitted, unless
      reg1 and reg2 are the same register. }
    procedure tcgcpu.a_load_reg_reg(list : TAsmList; fromsize,tosize : tcgsize;
      reg1,reg2 : tregister);
      var
        conv_done : Boolean;
        instr : taicpu;
      begin
         if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then
           internalerror(2020030710);

         conv_done:=false;
         if tosize<>fromsize then
           begin
             conv_done:=true;
             { when the destination is not larger than the source, the
               extension is selected by the destination size }
             if tcgsize2size[tosize]<=tcgsize2size[fromsize] then
              fromsize:=tosize;
             case fromsize of
                OS_8:
list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,reg2,reg1,0,8));
                OS_S8:
                  begin
                    { SEXT if the selected cpu type has it, otherwise a
                      shift left/arithmetic shift right pair by 24 }
                    if CPUXTENSA_HAS_SEXT in cpu_capabilities[current_settings.cputype] then
                      list.concat(taicpu.op_reg_reg_const(A_SEXT,reg2,reg1,7))
                    else
                      begin
                        list.concat(taicpu.op_reg_reg_const(A_SLLI,reg2,reg1,24));
                        list.concat(taicpu.op_reg_reg_const(A_SRAI,reg2,reg2,24));
                      end;
                    { for an OS_16 destination only the lower 16 bits are kept }
                    if tosize=OS_16 then
                      list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,reg2,reg2,0,16));
                  end;
                OS_16:
                  list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,reg2,reg1,0,16));
                OS_S16:
                  { same scheme as for OS_S8, with a shift count of 16 }
                  if CPUXTENSA_HAS_SEXT in cpu_capabilities[current_settings.cputype] then
                    list.concat(taicpu.op_reg_reg_const(A_SEXT,reg2,reg1,15))
                  else
                    begin
                      list.concat(taicpu.op_reg_reg_const(A_SLLI,reg2,reg1,16));
                      list.concat(taicpu.op_reg_reg_const(A_SRAI,reg2,reg2,16));
                    end;
                else
                  { all other sizes: fall through to the plain move below }
                  conv_done:=false;
              end;
           end;
         if not conv_done and (reg1<>reg2) then
           begin
             { same size, only a register mov required }
             instr:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
             list.Concat(instr);
             { Notify the register allocator that we have written a move instruction so
               it can try to eliminate it. }
             add_move_instruction(instr);
           end;
       end;


    { Emits a store of reg to ref. The store instruction (S8I, S16I or S32I)
      is selected by tosize; any other tosize raises an internal error.
      References which contain a symbol or an index register, or whose offset
      is outside the range checked below, are rewritten by fixref first. }
    procedure tcgcpu.a_load_reg_ref(list : TAsmList; fromsize,tosize : tcgsize;
      reg : tregister; const ref : TReference);
      var
        op: TAsmOp;
        href : treference;
      begin
        if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
          FromSize := ToSize;
        case tosize of
          { signed integer registers }
          OS_8,
          OS_S8:
            op:=A_S8I;
          OS_16,
          OS_S16:
            op:=A_S16I;
          OS_32,
          OS_S32:
            op:=A_S32I;
          else
            InternalError(2020030804);
        end;
        { work on a copy, ref itself is a const parameter }
        href:=ref;
        { offsets accepted without fixref: 0..255 for S8I, even values in
          0..510 for S16I, multiples of 4 in 0..1020 for S32I }
        { NOTE(review): unlike a_load_ref_reg, a reference with neither base
          nor index is not passed to fixref here - confirm this is intended }
        if assigned(href.symbol) or
          (href.index<>NR_NO) or
          ((op=A_S8I) and ((href.offset<0) or (href.offset>255))) or
          ((op=A_S16I) and ((href.offset<0) or (href.offset>510) or (href.offset mod 2<>0))) or
          ((op=A_S32I) and ((href.offset<0) or (href.offset>1020) or (href.offset mod 4<>0))) then
          fixref(list,href);
        list.concat(taicpu.op_reg_ref(op,reg,href));
      end;


    { Emits a load from ref into reg. The load instruction is selected by
      fromsize; afterwards the value is converted to tosize if required. }
    procedure tcgcpu.a_load_ref_reg(list : TAsmList; fromsize,tosize : tcgsize;
      const ref : TReference; reg : tregister);
      var
        href: treference;
        op: TAsmOp;
        tmpreg: TRegister;
      begin
        case fromsize of
          OS_8: op:=A_L8UI;
          OS_16: op:=A_L16UI;
          { OS_S8 uses the same load as OS_8; the sign extension is emitted
            separately after the load }
          OS_S8: op:=A_L8UI;
          OS_S16: op:=A_L16SI;
          OS_64,OS_S64, { This only happens if tosize is smaller than fromsize }
          { We can therefore only consider the low 32-bit of the 64bit value }
          OS_32,
          OS_S32: op:=A_L32I;
        else
          internalerror(2020030805);
        end;
        { work on a copy, ref itself is a const parameter }
        href:=ref;
        { offsets accepted without fixref: 0..255 for L8UI, even values in
          0..510 for L16SI/L16UI, multiples of 4 in 0..1020 for L32I }
        if assigned(href.symbol) or
          (href.index<>NR_NO) or
          ((op=A_L8UI) and ((href.offset<0) or (href.offset>255))) or
          ((op in [A_L16SI,A_L16UI]) and ((href.offset<0) or (href.offset>510) or (href.offset mod 2<>0))) or
          ((op=A_L32I) and
((href.offset<0) or (href.offset>1020) or (href.offset mod 4<>0))) or
          ((href.base=NR_NO) and (href.index=NR_NO)) then
          fixref(list,href);
        list.concat(taicpu.op_reg_ref(op,reg,href));

        { the byte was loaded with L8UI: sign extend it here unless the
          destination is a byte as well }
        if (fromsize=OS_S8) and not(tosize in [OS_S8,OS_8]) then
          if CPUXTENSA_HAS_SEXT in cpu_capabilities[current_settings.cputype] then
            list.concat(taicpu.op_reg_reg_const(A_SEXT,reg,reg,7))
          else
            begin
              list.concat(taicpu.op_reg_reg_const(A_SLLI,reg,reg,24));
              list.concat(taicpu.op_reg_reg_const(A_SRAI,reg,reg,24));
            end;
        { remaining size conversion is done in place by a_load_reg_reg }
        if (fromsize<>tosize) and (not (tosize in [OS_SINT,OS_INT])) then
          a_load_reg_reg(list,fromsize,tosize,reg,reg);
      end;


    { Emits code that loads the constant a into reg: MOVI for values in
      -2048..2047, otherwise an L32R from an entry obtained through
      create_data_entry. }
    procedure tcgcpu.a_load_const_reg(list : TAsmList; size : tcgsize;
      a : tcgint; reg : tregister);
      var
        hr : treference;
        l : TAsmLabel;
      begin
        if (a>=-2048) and (a<=2047) then
          list.Concat(taicpu.op_reg_const(A_MOVI,reg,a))
        else
          begin
            reference_reset(hr,4,[]);
            { the value is truncated to longint for the data entry }
            hr.symbol:=create_data_entry(nil,longint(a));
            list.concat(taicpu.op_reg_ref(A_L32R,reg,hr));
          end;
      end;


    { Rewrites ref in place: symbol, offset and index are folded into
      registers by the emitted code, so that on exit ref has symbol=nil,
      offset=0 and index=NR_NO. }
    procedure tcgcpu.fixref(list : TAsmList;var ref : treference);
      var
        tmpreg, tmpreg2 : tregister;
        tmpref : treference;
        l : tasmlabel;
      begin
        { create consts entry }
        if assigned(ref.symbol) or (ref.offset<-2048) or (ref.offset>2047) or
          ((ref.base=NR_NO) and (ref.index=NR_NO)) then
          begin
            reference_reset(tmpref,4,[]);
            tmpreg:=NR_NO;

            { load consts entry }
            tmpreg:=getintregister(list,OS_INT);
            if ref.symbol=nil then
              a_load_const_reg(list,OS_ADDR,ref.offset,tmpreg)
            else
              begin
                { symbol and offset go into one data entry that is loaded
                  with L32R }
                tmpref.symbol:=create_data_entry(ref.symbol,ref.offset);
                list.concat(taicpu.op_reg_ref(A_L32R,tmpreg,tmpref));
end;

            { merge the loaded value with the registers of the reference }
            if ref.base<>NR_NO then
              begin
                if ref.index<>NR_NO then
                  begin
                    { base and index are both taken: add the base to the
                      loaded value and use the sum as the new base }
                    list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
                    ref.base:=tmpreg;
                  end
                else
                  ref.index:=tmpreg;
              end
            else
              ref.base:=tmpreg;
          end
        else if ref.offset<>0 then
          begin
            tmpreg:=getintregister(list,OS_INT);
            if (ref.offset>=-128) and (ref.offset<=127) then
              begin
                { NOTE(review): if ref.base is NR_NO while ref.index is set,
                  this ADDI gets NR_NO as source register - confirm that
                  such references never reach this branch }
                list.concat(taicpu.op_reg_reg_const(A_ADDI,tmpreg,ref.base,ref.offset));
                ref.base:=tmpreg;
              end
            else
              begin
                { offset is within -2048..2047 here, see the first condition }
                list.concat(taicpu.op_reg_const(A_MOVI,tmpreg,ref.offset));
                if ref.base<>NR_NO then
                  begin
                    if ref.index<>NR_NO then
                      begin
                        list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
                        ref.base:=tmpreg;
                      end
                    else
                      ref.index:=tmpreg;
                  end
                else
                  ref.base:=tmpreg;
              end;
          end;

        { fold a remaining index register into the base }
        if ref.index<>NR_NO then
          begin
            if ref.base<>NR_NO then
              begin
                tmpreg:=getintregister(list,OS_INT);
                list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,ref.index));
                ref.base:=tmpreg;
              end
            else
              ref.base:=ref.index;
            ref.index:=NR_NO;
          end;
        { symbol and offset are part of the register contents now }
        ref.offset:=0;
        ref.symbol:=nil;
      end;


    { Emits code that loads the address described by ref into r. }
    procedure tcgcpu.a_loadaddr_ref_reg(list : TAsmList;
      const ref : TReference; r : tregister);
       var
        b : byte;
        tmpref : treference;
        instr : taicpu;
      begin
        tmpref:=ref;
        { Be sure to have a base register }
        if tmpref.base=NR_NO
then
          begin
            tmpref.base:=tmpref.index;
            tmpref.index:=NR_NO;
          end;

        { references with a symbol are reduced to a plain base register first }
        if assigned(tmpref.symbol) then
          fixref(list,tmpref);

        { expect a base here if there is an index }
        if (tmpref.base=NR_NO) and (tmpref.index<>NR_NO) then
          internalerror(200312022);

        if tmpref.index<>NR_NO then
          begin
            { r:=base+index, followed by adding the offset if there is one }
            a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpref.base,tmpref.index,r);
            if tmpref.offset<>0 then
              a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,r,r);
          end
        else
          begin
            if tmpref.base=NR_NO then
              { neither base nor index: the address is the offset itself }
              a_load_const_reg(list,OS_ADDR,tmpref.offset,r)
            else
              if tmpref.offset<>0 then
                a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,tmpref.base,r)
              else
                begin
                  { only a base register: plain move, reported to the
                    register allocator through add_move_instruction }
                  instr:=taicpu.op_reg_reg(A_MOV,r,tmpref.base);
                  list.concat(instr);
                  add_move_instruction(instr);
                end;
          end;
      end;


    { Emits "dst:=dst op src". OP_NEG and OP_NOT are handled here as unary
      operations on src, all other operations are passed on to
      a_op_reg_reg_reg. }
    procedure tcgcpu.a_op_reg_reg(list : TAsmList; op : topcg; size : tcgsize; src,dst : tregister);
      var
        tmpreg : TRegister;
      begin
        if op = OP_NEG then
          begin
            list.concat(taicpu.op_reg_reg(A_NEG,dst,src));
            maybeadjustresult(list,OP_NEG,size,dst);
          end
        else if op = OP_NOT then
          begin
            { emitted as an XOR of src with a register holding -1 }
            tmpreg:=getintregister(list,size);
            list.concat(taicpu.op_reg_const(A_MOVI,tmpreg,-1));
            list.concat(taicpu.op_reg_reg_reg(A_XOR,dst,tmpreg,src));
            maybeadjustresult(list,OP_NOT,size,dst);
          end
        else
          a_op_reg_reg_reg(list,op,size,src,dst,dst);
      end;


    { Emits "dst:=src op a" for the constant a. Several constants are mapped
      to a shorter instruction sequence; everything else loads a into a
      temporary register and uses a_op_reg_reg_reg. }
    procedure tcgcpu.a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister);
      var
        l1 : longint;
        tmpreg : TRegister;
      begin
        { op and a are passed to optimize_op_const before being inspected }
        optimize_op_const(size, op, a);
        case op of
          OP_NONE:
    begin
              { nothing to calculate: only copy src to dst if they differ }
              if src <> dst then
                a_load_reg_reg(list, size, size, src, dst);
              exit;
            end;
          OP_MOVE:
            begin
              a_load_const_reg(list, size, a, dst);
              exit;
            end;
          else
            ;
        end;

        { there could be added some more sophisticated optimizations }
        if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
          a_op_reg_reg(list,OP_NEG,size,src,dst)
        { we do this here instead in the peephole optimizer because
          it saves us a register }
        else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) then
          a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
        { we cannot make use of SUB(X) here because the initial shift might overflow }
        { multiplication by 3, 5 and 9 with a single ADDX2/ADDX4/ADDX8 }
        else if (op in [OP_MUL,OP_IMUL]) and (a=3) then
          list.concat(taicpu.op_reg_reg_reg(A_ADDX2,dst,src,src))
        else if (op in [OP_MUL,OP_IMUL]) and (a=5) then
          list.concat(taicpu.op_reg_reg_reg(A_ADDX4,dst,src,src))
        else if (op in [OP_MUL,OP_IMUL]) and (a=9) then
          list.concat(taicpu.op_reg_reg_reg(A_ADDX8,dst,src,src))
        { a=2^l1+8, 2^l1+4, 2^l1+2 or 2^l1+1: shift src into dst, then add
          the scaled src; src is read after dst was written, hence the
          src<>dst condition }
        else if (op in [OP_MUL,OP_IMUL]) and (src<>dst) and ispowerof2(a-8,l1) then
          begin
            a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst);
            list.concat(taicpu.op_reg_reg_reg(A_ADDX8,dst,src,dst));
          end
        else if (op in [OP_MUL,OP_IMUL]) and (src<>dst) and ispowerof2(a-4,l1) then
          begin
            a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst);
            list.concat(taicpu.op_reg_reg_reg(A_ADDX4,dst,src,dst));
          end
        else if (op in [OP_MUL,OP_IMUL]) and (src<>dst) and ispowerof2(a-2,l1) then
          begin
            a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst);
            list.concat(taicpu.op_reg_reg_reg(A_ADDX2,dst,src,dst));
          end
        else if (op in [OP_MUL,OP_IMUL]) and (src<>dst) and ispowerof2(a-1,l1) then
          begin
            a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst);
            list.concat(taicpu.op_reg_reg_reg(A_ADD,dst,src,dst));
          end
        { additions: a single ADDI for -128..127, otherwise ADDMI for the
          upper part followed by ADDI for the lower 8 bits taken as a
          signed value }
        else if (op=OP_ADD) and (a>=-128) and (a<=127) then
          list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,src,a))
        else if (op=OP_ADD) and (a>=-128-32768) and (a<=127+32512) then
          begin
{$ifdef EXTDEBUG}
            list.concat(tai_comment.Create(strpnew('Value: '+tostr(a))));
{$endif EXTDEBUG}
            list.concat(taicpu.op_reg_reg_const(A_ADDMI,dst,src,Smallint((a+128) and $ff00)));
            list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,dst,Shortint(a and $ff)));
          end
        { subtractions are emitted as additions of -a }
        else if (op=OP_SUB) and (a>=-127) and (a<=128) then
          list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,src,-a))
        else if (op=OP_SUB) and (a>=-127-32512) and (a<=128+32768) then
          begin
{$ifdef EXTDEBUG}
            list.concat(tai_comment.Create(strpnew('Value: '+tostr(a))));
{$endif EXTDEBUG}
            a:=-a;
            list.concat(taicpu.op_reg_reg_const(A_ADDMI,dst,src,Smallint((a+128) and $ff00)));
            list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,dst,Shortint(a and $ff)));
          end
        { shifts by a constant }
        else if (op=OP_SHL) and (a>=1) and (a<=31) then
          list.concat(taicpu.op_reg_reg_const(A_SLLI,dst,src,a))
        else if (op=OP_SAR) and (a>=0) and (a<=31) then
          list.concat(taicpu.op_reg_reg_const(A_SRAI,dst,src,a))
        { SRLI is only used for counts up to 15, larger counts use EXTUI
          with start bit a and a width of 32-a bits }
        else if (op=OP_SHR) and (a>=0) and (a<=15) then
          list.concat(taicpu.op_reg_reg_const(A_SRLI,dst,src,a))
        else if (op=OP_SHR) and (a>15) and (a<=31) then
          list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,dst,src,a,32-a))
        { AND with a constant whose set bits form one run of at most 16 bits
          starting at bit 0: emitted as EXTUI of that many bits }
        else if (op=OP_AND) and (63-BsrQWord(qword(a))+PopCnt(QWord(a))=64) and (PopCnt(QWord(a))<=16) then
          list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,dst,src,0,PopCnt(QWord(a))))
        else
          begin
            { general case: load the constant into a temporary register }
            tmpreg:=getintregister(list,size);
            a_load_const_reg(list,size,a,tmpreg);
a_op_reg_reg_reg(list,op,size,tmpreg,src,dst);
          end;
        maybeadjustresult(list,op,size,dst);
      end;


    { Emits "reg:=reg op a" by calling a_op_const_reg_reg with reg as both
      source and destination. }
    procedure tcgcpu.a_op_const_reg(list : TAsmList; op : topcg; size : tcgsize; a : tcgint; reg : tregister);
      begin
        a_op_const_reg_reg(list,op,size,a,reg,reg);
      end;


    { Emits "dst:=src2 op src1".

      list: assembler list the instructions are appended to
      op:   operation to perform
      size: size of the operation, passed on to maybeadjustresult
      src1: second operand; the only operand of OP_NOT, OP_NEG and OP_MOVE,
            and the shift count of the shift operations
      src2: first operand, the shifted value of the shift operations
      dst:  register receiving the result }
    procedure tcgcpu.a_op_reg_reg_reg(list : TAsmList; op : topcg;
      size : tcgsize; src1,src2,dst : tregister);
      var
        tmpreg : TRegister;
      begin
        if op=OP_NOT then
          begin
            { not x is emitted as x xor -1, like in a_op_reg_reg; without
              the XOR, dst would never be written and the -1 loaded into
              tmpreg would be unused }
            tmpreg:=getintregister(list,size);
            list.concat(taicpu.op_reg_const(A_MOVI,tmpreg,-1));
            list.concat(taicpu.op_reg_reg_reg(A_XOR,dst,tmpreg,src1));
            maybeadjustresult(list,op,size,dst);
          end
        else if op=OP_NEG then
          begin
            list.concat(taicpu.op_reg_reg(A_NEG,dst,src1));
            maybeadjustresult(list,op,size,dst);
          end
        else if op in [OP_SAR,OP_SHL,OP_SHR] then
          begin
            { the shift count is set up from src1 with SSL (left shifts) or
              SSR (right shifts), the shift instruction itself only takes
              the destination and the value to be shifted }
            if op=OP_SHL then
              list.concat(taicpu.op_reg(A_SSL,src1))
            else
              list.concat(taicpu.op_reg(A_SSR,src1));
            list.concat(taicpu.op_reg_reg(TOpCG2AsmOp[op],dst,src2));
            maybeadjustresult(list,op,size,dst);
          end
        else
          case op of
            OP_MOVE:
              a_load_reg_reg(list,size,size,src1,dst);
            else
              begin
                { all remaining operations map to one three register
                  instruction taken from TOpCG2AsmOp }
                list.concat(taicpu.op_reg_reg_reg(TOpCG2AsmOp[op],dst,src2,src1));
                maybeadjustresult(list,op,size,dst);
              end;
          end;
       end;


    { Emits a call to the symbol s with the call instruction of the current
      procedure (txtensaprocinfo.callins); a weak reference to s is created
      if weak is set. }
    procedure tcgcpu.a_call_name(list : TAsmList; const s : string;
      weak : boolean);
      begin
        if not weak then
          list.concat(taicpu.op_sym(txtensaprocinfo(current_procinfo).callins,current_asmdata.RefAsmSymbol(s,AT_FUNCTION)))
        else
          list.concat(taicpu.op_sym(txtensaprocinfo(current_procinfo).callins,current_asmdata.WeakRefAsmSymbol(s,AT_FUNCTION)));
      end;


    { Emits a call through the register Reg with the register call
      instruction of the current procedure (txtensaprocinfo.callxins). }
    procedure tcgcpu.a_call_reg(list : TAsmList; Reg : tregister);
      begin
list.concat(taicpu.op_reg(txtensaprocinfo(current_procinfo).callxins,reg));
      end;


    { Emits a jump (J with the L postfix) to the symbol s. A15 is passed as
      additional register operand. }
    procedure tcgcpu.a_jmp_name(list : TAsmList; const s : string);
      var
        ai : taicpu;
        tmpreg: TRegister;
      begin
        { for now, we use A15 here, however, this is not safe as it might contain an argument }
        ai:=TAiCpu.op_sym_reg(A_J,current_asmdata.RefAsmSymbol(s,AT_FUNCTION),NR_A15);
        { if destination is too far for J then assembler can convert to JX;
          this is a brace comment on purpose, so that it cannot extend over
          the statements which follow it }
        ai.oppostfix := PF_L;
        ai.is_jmp:=true;
        list.Concat(ai);
      end;


    { Emits a conditional branch to l that tests the register f.register
      with the condition derived from f.flag. An internal error is raised if
      the selected cpu type lacks CPUXTENSA_HAS_BOOLEAN_OPTION. }
    procedure tcgcpu.a_jmp_flags(list: TAsmList; const f: TResFlags; l: tasmlabel);
      var
        instr: taicpu;
      begin
        if CPUXTENSA_HAS_BOOLEAN_OPTION in cpu_capabilities[current_settings.cputype] then
          begin
            instr:=taicpu.op_reg_sym(A_B,f.register,l);
            instr.condition:=flags_to_cond(f.flag);
            instr.is_jmp:=true;
            list.concat(instr);
          end
        else
          Internalerror(2020070401);
      end;


    procedure tcgcpu.g_proc_entry(list : TAsmList; localsize : longint;
      nostackframe : boolean);
      var
         ref : treference;
         r : byte;
         regs : tcpuregisterset;
         stackmisalignment : pint;
         regoffset : LongInt;
         stack_parameters : Boolean;
         registerarea : PtrInt;
         l : TAsmLabel;
      begin
        LocalSize:=align(LocalSize,4);
        stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
        { call instruction does not put anything on the stack }
        registerarea:=0;
        if not(nostackframe) then
          begin
            regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
            a_reg_alloc(list,NR_STACK_POINTER_REG);
            case target_info.abi of
              abi_xtensa_call0:
                begin
                  list.concat(tai_comment.Create(strpnew('  Start of abi_call0 entry localsize='+tostr(localsize))));
           if current_procinfo.framepointer<>NR_STACK_POINTER_REG then                    Include(regs,RS_A15);                  if pi_do_call in current_procinfo.flags then                    Include(regs,RS_A0);                  if regs<>[] then                     begin                       for r:=RS_A0 to RS_A15 do                         if r in regs then                           inc(registerarea,4);                     end;                  if stack_parameters and (pi_estimatestacksize in current_procinfo.flags) then                    begin                      list.concat(tai_comment.Create(strpnew('Stackframe size was estimated before code generation due to stack parameters')));                      list.concat(tai_comment.Create(strpnew('  Calculated stackframe size: '+tostr(txtensaprocinfo(current_procinfo).stackframesize))));                      list.concat(tai_comment.Create(strpnew('  Max. outgoing parameter size: '+tostr(txtensaprocinfo(current_procinfo).maxpushedparasize))));                      list.concat(tai_comment.Create(strpnew('  End of last temporary location: '+tostr(tg.lasttemp))));                      list.concat(tai_comment.Create(strpnew('  Size of register area: '+tostr(registerarea))));                      list.concat(tai_comment.Create(strpnew('  Required size after code generation: '+tostr(localsize))));                      if localsize>txtensaprocinfo(current_procinfo).stackframesize then                        internalerror(2020091001);                      localsize:=txtensaprocinfo(current_procinfo).stackframesize;                    end                  else                    begin                      inc(localsize,registerarea);                      localsize:=align(localsize,current_settings.alignment.localalignmax);                    end;                  if LocalSize<>0 then                    begin                      a_reg_alloc(list,NR_STACK_POINTER_REG);                      { not sure if 32512 is the correct 
value or if it can be larger }                      if Localsize>32512 then                        begin                          reference_reset(ref,4,[]);                          ref.symbol:=create_data_entry(nil,-localsize);                          list.concat(tai_comment.Create(strpnew(' Decreasing stack pointer by localsize='+tostr(localsize)+' using A8 register')));                          list.concat(taicpu.op_reg_ref(A_L32R,NR_A8,ref));                          list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_A8));                        end                      else                        begin                          list.concat(tai_comment.Create(strpnew(' Decreasing stack pointer by localsize='+tostr(localsize)+' using A8 register')));                          list.concat(taicpu.op_reg_reg_const(A_ADDI,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,-localsize));                        end;                    end;                  reference_reset(ref,4,[]);                  ref.base:=NR_STACK_POINTER_REG;                  ref.offset:=localsize;                  if localsize>1024 then                    begin                      list.concat(tai_comment.Create(strpnew('  Special entry code of abi_xtensa_call0 entry localsize='+tostr(localsize))));                      if localsize<=1024+32512 then                        begin                          list.concat(taicpu.op_reg_reg_const(A_ADDI,NR_A8,NR_STACK_POINTER_REG,localsize-registerarea));                          reference_reset(ref,4,[]);                          ref.base:=NR_A8;                          ref.offset:=registerarea;                        end                      else                        begin                          reference_reset(ref,4,[]);                          ref.symbol:=create_data_entry(nil,localsize-registerarea);                          list.concat(taicpu.op_reg_ref(A_L32R,NR_A8,ref));                          
list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_A8,NR_A8,NR_STACK_POINTER_REG));                          reference_reset(ref,4,[]);                          ref.base:=NR_A8;                          ref.offset:=registerarea;                        end;                    end;                  if current_procinfo.framepointer<>NR_STACK_POINTER_REG then                    begin                      dec(ref.offset,4);                      list.concat(tai_comment.Create(strpnew(' Storing reg A15 at offset='+tostr(ref.offset))));                      list.concat(taicpu.op_reg_ref(A_S32I,NR_A15,ref));                      a_reg_alloc(list,NR_FRAME_POINTER_REG);                      list.concat(taicpu.op_reg_reg(A_MOV,NR_A15,NR_STACK_POINTER_REG));                    end;                  if regs<>[] then                    begin                      for r:=RS_A14 downto RS_A0 do                        if r in regs then                          begin                            dec(ref.offset,4);                            list.concat(tai_comment.Create(strpnew(' Storing reg '+std_regname(newreg(R_INTREGISTER,r,R_SUBWHOLE))+' at offset='+tostr(ref.offset))));                            list.concat(taicpu.op_reg_ref(A_S32I,newreg(R_INTREGISTER,r,R_SUBWHOLE),ref));                          end;                    end;                end;              abi_xtensa_windowed:                begin                  list.concat(tai_comment.Create(strpnew('  Start of abi_windowed entry localsize='+tostr(localsize))));                  if stack_parameters and (pi_estimatestacksize in current_procinfo.flags) then                    begin                      list.concat(tai_comment.Create(strpnew('Stackframe size was estimated before code generation due to stack parameters')));                      list.concat(tai_comment.Create(strpnew('  Calculated stackframe size: '+tostr(txtensaprocinfo(current_procinfo).stackframesize))));                      list.concat(tai_comment.Create(strpnew('  
Max. outgoing parameter size: '+tostr(txtensaprocinfo(current_procinfo).maxpushedparasize))));                      list.concat(tai_comment.Create(strpnew('  End of last temporary location: '+tostr(tg.lasttemp))));                      list.concat(tai_comment.Create(strpnew('  Max. window rotation in bytes: '+tostr(txtensaprocinfo(current_procinfo).maxcall*4))));                      list.concat(tai_comment.Create(strpnew('  Required size after code generation: '+tostr(localsize))));                      { should never happen as localsize is derived from                        txtensaprocinfo(current_procinfo).stackframesize }                      if localsize>txtensaprocinfo(current_procinfo).stackframesize then                        internalerror(2020031402);                      localsize:=txtensaprocinfo(current_procinfo).stackframesize;                    end                  else                    begin                      localsize:=align(localsize,current_settings.alignment.localalignmax);                      inc(localsize,4*4);                      if pi_do_call in current_procinfo.flags then                        inc(localsize,txtensaprocinfo(current_procinfo).maxcall*4);                    end;                  if localsize<0 then                    Internalerror(2020083001);                  if localsize>32760 then                    begin                      list.concat(taicpu.op_reg_const(A_ENTRY,NR_STACK_POINTER_REG,32));                      reference_reset(ref,4,[]);                      ref.symbol:=create_data_entry(nil,longint(localsize-32));                      list.concat(taicpu.op_reg_ref(A_L32R,NR_A8,ref));                      list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_A8,NR_STACK_POINTER_REG,NR_A8));                      list.concat(taicpu.op_reg_reg(A_MOVSP,NR_STACK_POINTER_REG,NR_A8));                    end                  else                    list.concat(taicpu.op_reg_const(A_ENTRY,NR_STACK_POINTER_REG,localsize));            
    end;
              else
                Internalerror(2020031401);
            end;
          end;
      end;


    { Emits the procedure epilogue for the ABI selected in target_info.abi.

      list          assembler list the epilogue is appended to
      parasize      not referenced by this implementation
      nostackframe  call0 only: when true no frame teardown is emitted, only
                    the return instruction

      abi_xtensa_windowed: a single RETW.
      abi_xtensa_call0: recomputes the frame size and the register save area
      the same way the call0 entry code does, reloads A15 (when a separate
      frame pointer is in use) and the remaining saved registers from the top
      of the frame downwards, adds the frame size back onto the stack pointer
      and emits RET.
      Any other ABI raises internal error 2020031403. }
    procedure tcgcpu.g_proc_exit(list : TAsmList; parasize : longint;
     nostackframe : boolean);
      var
         ref : treference;
         r : byte;
         regs : tcpuregisterset;
         stack_parameters : Boolean;
         registerarea : PtrInt;
         LocalSize: longint;
      begin
        case target_info.abi of
          abi_xtensa_windowed:
            list.Concat(taicpu.op_none(A_RETW));
          abi_xtensa_call0:
            begin
              if not(nostackframe) then
                begin
                  LocalSize:=current_procinfo.calc_stackframe_size;
                  LocalSize:=align(LocalSize,4);
                  stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
                  { 4 bytes of save area for every register that has to be restored }
                  registerarea:=0;
                  regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
                  if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
                    Include(regs,RS_A15);
                  if pi_do_call in current_procinfo.flags then
                    Include(regs,RS_A0);
                  if regs<>[] then
                     begin
                       for r:=RS_A0 to RS_A15 do
                         if r in regs then
                           inc(registerarea,4);
                     end;
                  { do we use the estimated stack size? If not, the register
                    area still has to be added to the frame size }
                  if not(stack_parameters and (pi_estimatestacksize in current_procinfo.flags)) then
                    begin
                      inc(localsize,registerarea);
                      localsize:=align(localsize,current_settings.alignment.localalignmax);
                    end;
                  if LocalSize<>0 then
                    begin
                      // Determine reference mode required to access stack
                      reference_reset(ref,4,[]);
                      ref.base:=NR_STACK_POINTER_REG;
                      ref.offset:=localsize;
                      if localsize>1024 then
                        begin
                          { the save area is addressed through A8, which is
                            set to the start of the register area }
                          if localsize<=1024+32512 then
                            begin
                              list.concat(taicpu.op_reg_reg_const(A_ADDI,NR_A8,NR_STACK_POINTER_REG,ref.offset-registerarea));
                              ref.offset:=registerarea;
                              ref.base:=NR_A8;
                            end
                          else
                            begin
                              { the distance must be computed from localsize:
                                reference_reset reinitialises ref (including
                                ref.offset), so reading ref.offset after it
                                would no longer yield the frame size and A8
                                would not point at the register area written
                                by the entry code }
                              reference_reset(ref,4,[]);
                              ref.symbol:=create_data_entry(nil,localsize-registerarea);
                              list.concat(taicpu.op_reg_ref(A_L32R,NR_A8,ref));
                              list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_A8,NR_A8,NR_STACK_POINTER_REG));
                              reference_reset(ref,4,[]);
                              ref.base:=NR_A8;
                              ref.offset:=registerarea;
                            end;
                        end;
                      // restore a15 if used
                      if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
                        begin
                          dec(ref.offset,4);
                          list.concat(tai_comment.Create(strpnew(' Restoring reg A15 from offset='+tostr(ref.offset))));
                          list.concat(taicpu.op_reg_ref(A_L32I,NR_A15,ref));
                          a_reg_dealloc(list,NR_FRAME_POINTER_REG);
                        end;
                      // restore rest of registers
                      if regs<>[] then
                        begin
                          for r:=RS_A14 downto RS_A0 do
                            if r in regs then
                              begin
                                dec(ref.offset,4);
                                list.concat(tai_comment.Create(strpnew(' Restoring reg '+std_regname(newreg(R_INTREGISTER,r,R_SUBWHOLE))+' from offset='+tostr(ref.offset))));
                                list.concat(taicpu.op_reg_ref(A_L32I,newreg(R_INTREGISTER,r,R_SUBWHOLE),ref));
                              end;
                        end;
                      // restore stack pointer
                      { not sure if 32512 is the correct value or if it can be larger }
                      list.concat(tai_comment.Create(strpnew(' Restoring stack pointer')));
                      if Localsize>32512 then
                        begin
                          { frame size is loaded from a literal entry into A8 }
                          reference_reset(ref,4,[]);
                          ref.symbol:=create_data_entry(nil,localsize);
                          list.concat(taicpu.op_reg_ref(A_L32R,NR_A8,ref));
                          list.concat(taicpu.op_reg_reg_reg(A_ADD,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,NR_A8));
                        end
                      else
                        list.concat(taicpu.op_reg_reg_const(A_ADDI,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,localsize));
                      a_reg_dealloc(list,NR_STACK_POINTER_REG);
                    end;
                  end;
              list.Concat(taicpu.op_none(A_RET));
            end
          else
            Internalerror(2020031403);
        end;
      end;


    { Emits a compare of reg against the constant a followed by a conditional
      jump to l. A_B with a "compare against zero" condition is used when a=0,
      with an "immediate" condition when a is accepted by is_b4const
      (OC_EQ/OC_NE/OC_LT/OC_GTE) or by is_b4constu (OC_B/OC_AE); every other
      combination is passed on to the inherited implementation. }
    procedure tcgcpu.a_cmp_const_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; a: tcgint; reg: tregister; l: tasmlabel);

      function is_b4const(v: tcgint): boolean;
        begin
          case v of
-1,1,2,3,4,5,6,7,8,
            10,12,16,32,64,128,256:
              result:=true;
          else
            result:=false;
          end;
        end;

      { true if v is one of the constants accepted below as immediate of the
        C_LTUI/C_GEUI branch conditions }
      function is_b4constu(v: tcgint): boolean;
        begin
          case v of
            32768,65536,
            2,3,4,5,6,7,8,
            10,12,16,32,64,128,256:
              result:=true;
          else
            result:=false;
          end;
        end;

      var
        op: TAsmCond;
        instr: taicpu;
      begin
        if (a=0) and (cmp_op in [OC_EQ,OC_NE,OC_LT,OC_GTE]) then
          begin
            { comparison against zero: no immediate operand needed }
            case cmp_op of
              OC_EQ: op:=C_EQZ;
              OC_NE: op:=C_NEZ;
              OC_LT: op:=C_LTZ;
              OC_GTE: op:=C_GEZ;
            else
              Internalerror(2020030806);
            end;
            instr:=taicpu.op_reg_sym(A_B,reg,l);
            instr.condition:=op;
            instr.is_jmp:=true;
            list.concat(instr);
          end
        else if is_b4const(a) and
               (cmp_op in [OC_EQ,OC_NE,OC_LT,OC_GTE]) then
          begin
            case cmp_op of
              OC_EQ: op:=C_EQI;
              OC_NE: op:=C_NEI;
              OC_LT: op:=C_LTI;
              OC_GTE: op:=C_GEI;
            else
              Internalerror(2020030807);
            end;
            instr:=taicpu.op_reg_const_sym(A_B,reg,a,l);
            instr.condition:=op;
            instr.is_jmp:=true;
            list.concat(instr);
          end
        else if is_b4constu(a) and
               (cmp_op in [OC_B,OC_AE]) then
          begin
            case cmp_op of
              OC_B: op:=C_LTUI;
              OC_AE: op:=C_GEUI;
            else
              Internalerror(2020030808);
            end;
            instr:=taicpu.op_reg_const_sym(A_B,reg,a,l);
            instr.condition:=op;
            instr.is_jmp:=true;
            list.concat(instr);
          end
        else
          inherited a_cmp_const_reg_label(list, size, cmp_op, a, reg, l);
      end;


    { Emits a register/register compare-and-branch to l. When
      TOpCmp2AsmCond has no condition for cmp_op, the comparison is swapped
      (swap_opcmp) together with the two registers. The instruction is built
      with reg2 as first and reg1 as second register operand. }
    procedure tcgcpu.a_cmp_reg_reg_label(list : TAsmList; size :
tcgsize;
        cmp_op : topcmp; reg1,reg2 : tregister; l : tasmlabel);
      var
        tmpreg: TRegister;
        instr: taicpu;
      begin
        if TOpCmp2AsmCond[cmp_op]=C_None then
          begin
            cmp_op:=swap_opcmp(cmp_op);
            tmpreg:=reg1;
            reg1:=reg2;
            reg2:=tmpreg;
          end;
        instr:=taicpu.op_reg_reg_sym(A_B,reg2,reg1,l);
        instr.condition:=TOpCmp2AsmCond[cmp_op];
        instr.is_jmp:=true;
        list.concat(instr);
      end;


    { Emits an unconditional jump to l. Labels bound as AB_GLOBAL get the
      PF_L postfix form of A_J with A15 as additional register operand, all
      other labels a plain A_J. }
    procedure tcgcpu.a_jmp_always(list : TAsmList; l : TAsmLabel);
      var
        ai : taicpu;
      begin
        if l.bind in [AB_GLOBAL] then
          begin
          { for now, we use A15 here, however, this is not safe as it might contain an argument, I have not figured out a
            solution yet }
            ai:=taicpu.op_sym_reg(A_J,l,NR_A15);
            ai.oppostfix := PF_L;
          end
        else
          ai:=taicpu.op_sym(A_J,l);
        ai.is_jmp:=true;
        list.concat(ai);
      end;


    { Materialises the flags f in reg: reg is preloaded with 0, a temporary
      with 1, and a conditional A_MOV (condition taken from f.flag, tested
      register f.register) copies the temporary into reg. }
    procedure tcgcpu.g_flags2reg(list: TAsmList; size: TCgSize; const f: tresflags; reg: TRegister);
      var
        hregister: TRegister;
        instr: taicpu;
      begin
        a_load_const_reg(list,size,0,reg);
        hregister:=getintregister(list,size);
        a_load_const_reg(list,size,1,hregister);
        instr:=taicpu.op_reg_reg_reg(A_MOV,reg,hregister,f.register);
        instr.condition:=flags_to_cond(f.flag);
        list.concat(instr);
      end;


    { Copies len bytes from source to dest.

      Copies of more than 100 bytes are delegated to g_concatcopy_move when
      the current procedure already performs calls. Otherwise the copy is
      emitted inline: more than four 32 bit words are copied by a loop (A_LOOP
      when the CPU has CPUXTENSA_HAS_LOOPS, else a counted loop), up to four
      words are unrolled, and the remaining 0..3 bytes are copied as one
      16 bit and/or one 8 bit access.
      Raises internal error 2002072704 if len exceeds high(longint). }
    procedure tcgcpu.g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);
      var
        tmpreg1, hreg, countreg: TRegister;
        src, dst, src2, dst2: TReference;
        lab:      tasmlabel;
        Count, count2: aint;

        { a reference can be used directly (without loading its address into
          a register) if it is a plain base register reference }
        function reference_is_reusable(const ref: treference): boolean;
          begin
            result:=(ref.base<>NR_NO) and (ref.index=NR_NO) and
               (ref.symbol=nil);
          end;

      begin
        src2:=source;
        fixref(list,src2);
        dst2:=dest;
        fixref(list,dst2);
        if len > high(longint) then
          internalerror(2002072704);
        { A call (to FPC_MOVE) requires the outgoing parameter area to be properly
          allocated on stack. This can only be done before tmipsprocinfo.set_first_temp_offset,
          i.e. before secondpass. Other internal procedures request correct stack frame
          by setting pi_do_call during firstpass, but for this particular one it is impossible.
          Therefore, if the current procedure is a leaf one, we have to leave it that way.
          NOTE(review): the procinfo class named above is the MIPS one; presumably this
          comment was inherited and the xtensa procinfo is meant - confirm. }

        { anybody wants to determine a good value here :)? }
        if (len > 100) and
           assigned(current_procinfo) and
           (pi_do_call in current_procinfo.flags) then
          g_concatcopy_move(list, src2, dst2, len)
        else
        begin
          Count := len div 4;
          if (count<=4) and reference_is_reusable(src2) then
            src:=src2
          else
            begin
              reference_reset(src,sizeof(aint),[]);
              { load the address of src2 into src.base }
              src.base := GetAddressRegister(list);
              a_loadaddr_ref_reg(list, src2, src.base);
            end;
          if (count<=4) and reference_is_reusable(dst2) then
            dst:=dst2
          else
            begin
              reference_reset(dst,sizeof(aint),[]);
              { load the address of dst2 into dst.base }
              dst.base := GetAddressRegister(list);
              a_loadaddr_ref_reg(list, dst2, dst.base);
            end;
          { generate a loop }
          if Count > 4 then
          begin
            countreg := GetIntRegister(list, OS_INT);
            tmpreg1  := GetIntRegister(list, OS_INT);
            a_load_const_reg(list, OS_INT, Count, countreg);
            current_asmdata.getjumplabel(lab);
            if CPUXTENSA_HAS_LOOPS in cpu_capabilities[current_settings.cputype] then
              begin
                { here the label is placed behind the loop body }
                list.concat(taicpu.op_reg_sym(A_LOOP, countreg, lab));
                list.concat(taicpu.op_reg_ref(A_L32I, tmpreg1, src));
                list.concat(taicpu.op_reg_ref(A_S32I, tmpreg1, dst));
                list.concat(taicpu.op_reg_reg_const(A_ADDI, src.base, src.base, 4));
                list.concat(taicpu.op_reg_reg_const(A_ADDI, dst.base, dst.base, 4));
                a_label(list, lab);
              end
            else
              begin
                { here the label is the loop head, countreg counts down to 0 }
                a_label(list, lab);
                list.concat(taicpu.op_reg_ref(A_L32I, tmpreg1, src));
                list.concat(taicpu.op_reg_ref(A_S32I, tmpreg1, dst));
                list.concat(taicpu.op_reg_reg_const(A_ADDI, src.base, src.base, 4));
                list.concat(taicpu.op_reg_reg_const(A_ADDI, dst.base, dst.base, 4));
                list.concat(taicpu.op_reg_reg_const(A_ADDI, countreg, countreg, -1));
                a_cmp_const_reg_label(list,OS_INT,OC_NE,0,countreg,lab);
                { keep the registers alive }
                list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
              end;
            { keep the registers alive }
            list.concat(taicpu.op_reg_reg(A_MOV,src.base,src.base));
            list.concat(taicpu.op_reg_reg(A_MOV,dst.base,dst.base));
            len := len mod 4;
          end;
          { unrolled loop }
          Count := len div 4;
          if Count > 0 then
          begin
            tmpreg1 := GetIntRegister(list, OS_INT);
            for count2 := 1 to Count do
            begin
              list.concat(taicpu.op_reg_ref(A_L32I, tmpreg1, src));
              list.concat(taicpu.op_reg_ref(A_S32I, tmpreg1, dst));
              Inc(src.offset, 4);
              Inc(dst.offset, 4);
            end;
            len := len mod 4;
          end;
          { copy the leftovers; at this point all whole words have been
            copied and len has been reduced modulo 4, so only a 16 bit
            and/or an 8 bit piece can remain }
          if (len and 2) <> 0 then
          begin
            hreg := GetIntRegister(list, OS_INT);
            a_load_ref_reg(list, OS_16, OS_16, src, hreg);
            a_load_reg_ref(list, OS_16, OS_16, hreg, dst);
            Inc(src.offset, 2);
            Inc(dst.offset, 2);
          end;
          if (len and 1) <> 0 then
          begin
            hreg := GetIntRegister(list, OS_INT);
            a_load_ref_reg(list, OS_8, OS_8, src, hreg);
            a_load_reg_ref(list, OS_8, OS_8, hreg, dst);
          end;
        end;
      end;


     { Register to register move between fpu registers (A_MOV with PF_S
       postfix). Only OS_32/OS_F32 sources are accepted, anything else raises
       internal error 2020032603. }
     procedure tcgcpu.a_loadfpu_reg_reg(list: TAsmList; fromsize,tosize: tcgsize; reg1, reg2: tregister);
       var
         ai: taicpu;
       begin
         if not(fromsize in [OS_32,OS_F32]) then
           InternalError(2020032603);
         ai := taicpu.op_reg_reg(A_MOV,reg2,reg1);
         ai.oppostfix := PF_S;
         list.concat(ai);
       end;


     { Loads an fpu register from memory. References with a symbol, with
       index plus offset, or with an offset outside 0..1020 or not a multiple
       of 4 are first simplified by fixref. A_LSX is used for base+index
       references, A_LSI otherwise. Only OS_32/OS_F32 sources are accepted
       (internal error 2020032602 otherwise). }
     procedure tcgcpu.a_loadfpu_ref_reg(list: TAsmList; fromsize,tosize: tcgsize; const ref: treference; reg: tregister);
       var
         href: treference;
       begin
         if not(fromsize in [OS_32,OS_F32]) then
           InternalError(2020032602);
         href:=ref;
         if assigned(href.symbol) or
           ((href.index<>NR_NO) and (href.offset<>0)) or
           (((href.offset<0) or (href.offset>1020) or (href.offset mod 4<>0))) then
           fixref(list,href);
         if (href.base<>NR_NO) and (href.index<>NR_NO) then
           list.concat(taicpu.op_reg_ref(A_LSX,reg,href))
         else
           list.concat(taicpu.op_reg_ref(A_LSI,reg,href));
         if fromsize<>tosize then
           a_loadfpu_reg_reg(list,fromsize,tosize,reg,reg);
       end;


     { Stores an fpu register to memory; the reference is simplified under
       the same conditions as in a_loadfpu_ref_reg. A_SSX is used for
       base+index references, A_SSI otherwise. Only OS_32/OS_F32 sources are
       accepted (internal error 2020032604 otherwise). }
     procedure tcgcpu.a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);
       var
         href: treference;
       begin
         if not(fromsize in [OS_32,OS_F32]) then
           InternalError(2020032604);
         href:=ref;
         if assigned(href.symbol) or
           ((href.index<>NR_NO) and (href.offset<>0)) or
      (((href.offset<0) or (href.offset>1020) or (href.offset mod 4<>0))) then
           fixref(list,href);
         { base+index references use the indexed store, everything else the
           immediate offset form }
         if (href.base<>NR_NO) and (href.index<>NR_NO) then
           list.concat(taicpu.op_reg_ref(A_SSX,reg,href))
         else
           list.concat(taicpu.op_reg_ref(A_SSI,reg,href));
       end;


    { Moves an integer register into an fpu register (A_WFR). Both sizes
      must be 4 bytes wide, otherwise internal error 2020091102 is raised. }
    procedure tcgcpu.a_loadfpu_intreg_reg(list : TAsmList; fromsize,tosize : tcgsize; intreg,fpureg : tregister);
      begin
        if not(tcgsize2size[fromsize]=4) or
           not(tcgsize2size[tosize]=4) then
          internalerror(2020091102);
        list.concat(taicpu.op_reg_reg(A_WFR,fpureg,intreg));
      end;


    { Moves an fpu register into an integer register (A_RFR). Both sizes
      must be 4 bytes wide, otherwise internal error 2020091202 is raised. }
    procedure tcgcpu.a_loadfpu_reg_intreg(list : TAsmList; fromsize,tosize : tcgsize; fpureg,intreg : tregister);
      begin
        if not(tcgsize2size[fromsize]=4) or
           not(tcgsize2size[tosize]=4) then
          internalerror(2020091202);
        list.concat(taicpu.op_reg_reg(A_RFR,intreg,fpureg));
      end;


    { For the operations listed in overflowops on 8 and 16 bit sizes, dst is
      reloaded into itself with an OS_32 -> size conversion; all other
      op/size combinations emit nothing. }
    procedure tcgcpu.maybeadjustresult(list : TAsmList; op : TOpCg; size : tcgsize; dst : tregister);
      const
        overflowops = [OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NEG];
      begin
        if (op in overflowops) and
           (size in [OS_8,OS_S8,OS_16,OS_S16]) then
          a_load_reg_reg(list,OS_32,size,dst,dst);
      end;


    { Intentionally emits no code. }
    procedure tcgcpu.g_overflowcheck(list: TAsmList; const Loc: tlocation; def: tdef);
      begin
        { no overflow checking yet }
      end;


    { Returns a label in current_procinfo.aktlocaldata that is followed by a
      constant holding symbol+offset (or just offset when symbol is nil).

      The existing local data is searched for a label directly followed by a
      matching constant; if one is found its label is returned, otherwise a
      new label and constant are appended.

      NOTE(review): the search only accepts constants whose consttype is
      aitconst_ptr, while symbol-less entries are appended through
      tai_const.Create_32bit. If that constructor tags the entry with a
      different consttype, plain numeric entries are never found again and
      are duplicated on every request - confirm against tai_const. }
    function tcgcpu.create_data_entry(symbol: TAsmSymbol;offset: asizeint): TAsmLabel;
      var
        hp: tai;
      begin
        hp:=tai(current_procinfo.aktlocaldata.first);
        while assigned(hp) do
          begin
            if (hp.typ=ait_label) and assigned(hp.Next) and
              (tai(hp.Next).typ=ait_const) and
              (tai_const(hp.Next).consttype=aitconst_ptr) and
              (tai_const(hp.Next).sym=symbol) and
              (tai_const(hp.Next).endsym=nil) and
              ((assigned(symbol) and (tai_const(hp.Next).symofs=offset)) or
               (not(assigned(symbol)) and (tai_const(hp.Next).value=offset))
              ) then
              begin
                { reuse the existing entry }
                Result:=tai_label(hp).labsym;
                exit;
              end;
            hp:=tai(hp.Next);
          end;
        { nothing suitable found: append a new label/constant pair }
        current_asmdata.getjumplabel(Result);
        cg.a_label(current_procinfo.aktlocaldata,Result);
        if assigned(symbol) then
          current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(symbol,offset))
        else
          current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(offset));
      end;


    { Bit scan of src into dst. Only the reverse scan is implemented; a
      forward scan raises internal error 2020092604. The not_zero, srcsize
      and dstsize parameters are not referenced.

      Emitted sequence: A_NSAU dst,src; an OP_SUB combining dst with a
      register holding 31 (presumably dst:=31-dst - verify against the
      operand order of a_op_reg_reg_reg); finally a conditional A_MOV with
      condition C_EQZ on src that replaces dst by 255. }
    procedure tcgcpu.a_bit_scan_reg_reg(list: TAsmList; reverse,not_zero: boolean; srcsize, dstsize: TCGSize; src, dst: TRegister);
      var
        ai: taicpu;
        tmpreg: TRegister;
      begin
        if reverse then
          begin
            list.Concat(taicpu.op_reg_reg(A_NSAU,dst,src));
            tmpreg:=getintregister(list,OS_INT);
            a_load_const_reg(list,OS_INT,31,tmpreg);
            a_op_reg_reg_reg(list,OP_SUB,OS_INT,dst,tmpreg,dst);
            tmpreg:=getintregister(list,OS_INT);
            a_load_const_reg(list,OS_INT,255,tmpreg);
            ai:=taicpu.op_reg_reg_reg(A_MOV,dst,tmpreg,src);
            ai.condition:=C_EQZ;
            list.Concat(ai);
          end
        else
          Internalerror(2020092604);
      end;


    { 64 bit three operand operation on register pairs.

      OP_AND/OP_OR/OP_XOR are applied to the low and high halves separately.
      OP_ADD and OP_SUB operate on the low halves first and then correct the
      high half by +1/-1 depending on an unsigned comparison of the low
      halves. OP_NEG and OP_NOT raise internal error 2020030810, any other
      operation 2020030813. }
    procedure tcg64fxtensa.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);
      var
        instr: taicpu;
        no_carry: TAsmLabel;
        tmpreg: TRegister;
      begin
        case op of
          OP_NEG,
          OP_NOT :
            internalerror(2020030810);
          else
            ;
        end;
        case op of
          OP_AND,OP_OR,OP_XOR:
            begin
              cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);
              cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);
            end;
          OP_ADD:
            begin
              { regsrc1.reglo is compared against the result afterwards, so
                it must not be overwritten by it }
              if (regsrc1.reglo=regdst.reglo) or
(regsrc1.reghi=regdst.reghi) then
                Internalerror(2020082205);
              list.concat(taicpu.op_reg_reg_reg(A_ADD, regdst.reglo, regsrc2.reglo, regsrc1.reglo));
              list.concat(taicpu.op_reg_reg_reg(A_ADD, regdst.reghi, regsrc2.reghi, regsrc1.reghi));
              current_asmdata.getjumplabel(no_carry);
              { the high half is only incremented when the branch on
                "result.lo above or equal regsrc1.lo" is not taken }
              cg.a_cmp_reg_reg_label(list,OS_INT,OC_AE, regsrc1.reglo, regdst.reglo, no_carry);
              list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reghi, regdst.reghi, 1));
              cg.a_label(list,no_carry);
            end;
          OP_SUB:
            begin
              if (regsrc1.reglo=regdst.reglo) or (regsrc1.reghi=regdst.reghi) then
                Internalerror(2020082206);
              { we need the original src2 value for the comparison, do not overwrite it }
              if regsrc2.reglo=regdst.reglo then
                begin
                  tmpreg:=cg.GetIntRegister(list,OS_S32);
                  cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc2.reglo,tmpreg);
                  regsrc2.reglo:=tmpreg;
                end;
              list.concat(taicpu.op_reg_reg_reg(A_SUB, regdst.reglo, regsrc2.reglo, regsrc1.reglo));
              list.concat(taicpu.op_reg_reg_reg(A_SUB, regdst.reghi, regsrc2.reghi, regsrc1.reghi));
              current_asmdata.getjumplabel(no_carry);
              { the high half is only decremented when the branch on
                "regsrc2.lo above or equal regsrc1.lo" is not taken }
              cg.a_cmp_reg_reg_label(list,OS_INT,OC_AE, regsrc1.reglo, regsrc2.reglo, no_carry);
              list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reghi, regdst.reghi, -1));
              cg.a_label(list,no_carry);
            end;
          else
            internalerror(2020030813);
        end;
      end;


    { 64 bit two operand operation regdst:=op(regsrc[,regdst]).

      OP_NEG negates both halves and, when the negated low half is not zero,
      replaces the high half by "negated high half - 1" through a
      conditional A_MOV (C_NEZ). OP_NOT inverts both halves. Every other
      operation is forwarded to a_op64_reg_reg_reg with regdst as second
      source. }
    procedure tcg64fxtensa.a_op64_reg_reg(list : TAsmList; op : TOpCG; size : tcgsize; regsrc,regdst : tregister64);
      var
        tmpreg : TRegister;
        instr : taicpu;
      begin
        case op of
          OP_NEG:
            begin
              tmpreg:=cg.GetIntRegister(list, OS_INT);
              list.concat(taicpu.op_reg_reg(A_NEG,regdst.reglo,regsrc.reglo));
              list.concat(taicpu.op_reg_reg(A_NEG,regdst.reghi,regsrc.reghi));
              list.concat(taicpu.op_reg_reg_const(A_ADDI,tmpreg,regdst.reghi,-1));
              instr:=taicpu.op_reg_reg_reg(A_MOV,regdst.reghi,tmpreg,regdst.reglo);
              instr.condition:=C_NEZ;
              list.concat(instr);
            end;
          OP_NOT:
            begin
              cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
              cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
            end;
          else
            a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);
        end;
      end;


    { 64 bit operation with a constant: regdst:=regsrc op value.

      OP_AND/OP_OR/OP_XOR  applied to the two halves with lo(value)/hi(value)
      OP_ADD               constants in -2048..2047 are added inline to the
                           low half with the high half adjusted for the
                           carry; other constants are loaded into a
                           temporary register pair and passed to
                           a_op64_reg_reg_reg
      OP_SUB               always through a temporary register pair
      OP_SHL               shift counts 1..16 and 32 only
                           (internal error 2020082209 otherwise)
      OP_SHR               shift counts 1..15 and 32 only
                           (internal error 2020082210 otherwise)
      OP_NEG/OP_NOT        internal error 2020030904
      anything else        internal error 2020030901 }
    procedure tcg64fxtensa.a_op64_const_reg_reg(list : TAsmList; op : TOpCG; size : tcgsize; value : int64; regsrc,regdst : tregister64);
      var
        tmpreg64 : tregister64;
        no_carry : TAsmLabel;
        tmpreg: tregister;
      begin
        case op of
          OP_NEG,
          OP_NOT :
            internalerror(2020030904);
          else
            ;
        end;
        case op of
          OP_AND,OP_OR,OP_XOR:
            begin
              cg.a_op_const_reg_reg(list,op,OS_32,aint(lo(value)),regsrc.reglo,regdst.reglo);
              cg.a_op_const_reg_reg(list,op,OS_32,aint(hi(value)),regsrc.reghi,regdst.reghi);
            end;
          OP_ADD:
            begin
              { could do better here (hi(value) in 248..2047), for now we support only the simple cases }
              if (value>=-2048) and (value<=2047) then
                begin
                  { we need the original src value for the comparison, do not overwrite it }
                  if regsrc.reglo=regdst.reglo then
                    begin
                      tmpreg:=cg.GetIntRegister(list,OS_S32);
                      cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc.reglo,tmpreg);
                      regsrc.reglo:=tmpreg;
                    end;
                  list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reglo, regsrc.reglo, value));
                  list.concat(taicpu.op_reg_reg(A_MOV, regdst.reghi, regsrc.reghi));
                  current_asmdata.getjumplabel(no_carry);
                  if value>=0 then
                    begin
                      { the high word of the constant is 0, so only the
                        carry has to be added: the low half wrapped around
                        iff the result is below the original low half }
                      cg.a_cmp_reg_reg_label(list,OS_INT,OC_AE, regsrc.reglo, regdst.reglo, no_carry);
                      list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reghi, regdst.reghi, 1));
                    end
                  else
                    begin
                      { the high word of the sign extended constant is -1,
                        so hi:=hi-1+carry. A carry out of the low half
                        happened iff the result is below the original low
                        half; in that case -1 and +1 cancel and the high
                        half stays untouched, otherwise it is decremented }
                      cg.a_cmp_reg_reg_label(list,OS_INT,OC_B, regsrc.reglo, regdst.reglo, no_carry);
                      list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reghi, regdst.reghi, -1));
                    end;
                  cg.a_label(list,no_carry);
                end
              else
                begin
                  tmpreg64.reglo := cg.GetIntRegister(list,OS_S32);
                  tmpreg64.reghi := cg.GetIntRegister(list,OS_S32);
                  a_load64_const_reg(list,value,tmpreg64);
                  a_op64_reg_reg_reg(list,op,size,tmpreg64,regsrc,regdst);
                end;
            end;
          OP_SHL:
            begin
              if (value>0) and (value<=16) then
                begin
                  { tmpreg receives the upper "value" bits of the low half,
                    which are or-ed into the shifted high half }
                  tmpreg:=cg.GetIntRegister(list,OS_32);
                  list.concat(taicpu.op_reg_reg_const_const(A_EXTUI, tmpreg, regsrc.reglo, 32-value, value));
                  list.concat(taicpu.op_reg_reg_const(A_SLLI, regdst.reglo, regsrc.reglo, value));
                  list.concat(taicpu.op_reg_reg_const(A_SLLI, regdst.reghi, regsrc.reghi, value));
                  list.concat(taicpu.op_reg_reg_reg(A_OR, regdst.reghi, tmpreg, regdst.reghi));
                end
              else if value=32 then
                begin
                  cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc.reglo,regdst.reghi);
                  cg.a_load_const_reg(list,OS_INT,0,regdst.reglo);
                end
              else
                Internalerror(2020082209);
            end;
          OP_SHR:
            begin
              if (value>0) and (value<=15) then
                begin
                  { tmpreg receives the lower "value" bits of the high half,
                    moved to the top, which are or-ed into the shifted low
                    half }
                  tmpreg:=cg.GetIntRegister(list,OS_32);
                  list.concat(taicpu.op_reg_reg_const(A_SLLI, tmpreg, regsrc.reghi, 32-value));
                  list.concat(taicpu.op_reg_reg_const(A_SRLI, regdst.reglo, regsrc.reglo, value));
                  list.concat(taicpu.op_reg_reg_reg(A_OR, regdst.reglo, tmpreg, regdst.reglo));
                  list.concat(taicpu.op_reg_reg_const(A_SRLI, regdst.reghi, regsrc.reghi, value));
                end
              else if value=32 then
                begin
                  cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc.reghi,regdst.reglo);
                  cg.a_load_const_reg(list,OS_INT,0,regdst.reghi);
                end
              else
                Internalerror(2020082210);
            end;
          OP_SUB:
            begin
              { for now, we take the simple approach }
              tmpreg64.reglo := cg.GetIntRegister(list,OS_S32);
              tmpreg64.reghi := cg.GetIntRegister(list,OS_S32);
              a_load64_const_reg(list,value,tmpreg64);
              a_op64_reg_reg_reg(list,op,size,tmpreg64,regsrc,regdst);
            end;
          else
            internalerror(2020030901);
        end;
      end;


    { In-place variant: reg:=reg op value, implemented through
      a_op64_const_reg_reg with reg as source and destination. }
    procedure tcg64fxtensa.a_op64_const_reg(list : TAsmList; op : TOpCG; size : tcgsize; value : int64; reg : tregister64);
      begin
        a_op64_const_reg_reg(list,op,size,value,reg,reg);
      end;


{$warnings off}
    { Instantiates the xtensa code generators and stores them in the global
      cg and cg64 variables. }
    procedure create_codegen;
      begin
        cg:=tcgcpu.Create;
        cg64:=tcg64fxtensa.Create;
      end;

end.
 |