{
    Copyright (c) 1998-2002 by Florian Klaempfl

    This unit implements the code generator for the PowerPC

    This program is free software; you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation; either version 2 of the License, or
    (at your option) any later version.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with this program; if not, write to the Free Software
    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.

****************************************************************************}unit cgcpu;{$i fpcdefs.inc}  interface    uses       globtype,symtype,symdef,       cgbase,cgobj,cgppc,       aasmbase,aasmcpu,aasmtai,aasmdata,       cpubase,cpuinfo,cgutils,cg64f32,rgcpu,       parabase;    type      tcgppc = class(tcgppcgen)        procedure init_register_allocators;override;        procedure done_register_allocators;override;        { passing parameters, per default the parameter is pushed }        { nr gives the number of the parameter (enumerated from   }        { left to right), this allows to move the parameter to    }        { register, if the cpu supports register calling          }        { conventions                                             }        procedure a_param_ref(list : TAsmList;size : tcgsize;const r : treference;const paraloc : tcgpara);override;        procedure a_call_name(list : TAsmList;const s : string; weak: boolean);override;        procedure a_call_reg(list : TAsmList;reg: tregister); override;        procedure a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: aint; reg: TRegister); override;        procedure a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister); override;        procedure a_op_const_reg_reg(list: TAsmList; op: TOpCg;          size: tcgsize; a: aint; src, dst: tregister); override;        procedure a_op_reg_reg_reg(list: TAsmList; op: TOpCg;          size: tcgsize; src1, src2, dst: tregister); override;        { move instructions }        procedure a_load_const_reg(list : TAsmList; size: tcgsize; a : aint;reg : tregister);override;        procedure a_load_ref_reg(list : TAsmList; fromsize, tosize : tcgsize;const Ref : treference;reg : tregister);override;        procedure a_load_reg_reg(list : TAsmList; fromsize, tosize : tcgsize;reg1,reg2 : tregister);override;        procedure a_load_subsetreg_reg(list : TAsmList; subsetsize: tcgsize;          tosize: tcgsize; const sreg: 
tsubsetregister; destreg: tregister); override;        procedure a_load_subsetreg_subsetreg(list: TAsmlist; fromsubsetsize, tosubsetsize: tcgsize; const fromsreg, tosreg: tsubsetregister); override;        {  comparison operations }        procedure a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : aint;reg : tregister;          l : tasmlabel);override;        procedure a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;reg1,reg2 : tregister;l : tasmlabel); override;        procedure a_jmp_name(list : TAsmList;const s : string); override;        procedure a_jmp_always(list : TAsmList;l: tasmlabel); override;        procedure a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel); override;        procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister); override;        procedure g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);override;        procedure g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean); override;        procedure g_save_registers(list:TAsmList); override;        procedure g_restore_registers(list:TAsmList); override;        procedure g_concatcopy(list : TAsmList;const source,dest : treference;len : aint);override;        { find out whether a is of the form 11..00..11b or 00..11...00. 
If }        { that's the case, we can use rlwinm to do an AND operation        }        function get_rlwi_const(a: aint; var l1, l2: longint): boolean;      protected       procedure a_load_regconst_subsetreg_intern(list : TAsmList; fromsize, subsetsize: tcgsize; fromreg: tregister; const sreg: tsubsetregister; slopt: tsubsetloadopt); override;      private        (* NOT IN USE: *)        procedure g_stackframe_entry_mac(list : TAsmList;localsize : longint);        (* NOT IN USE: *)        procedure g_return_from_proc_mac(list : TAsmList;parasize : aint);        { clear out potential overflow bits from 8 or 16 bit operations  }        { the upper 24/16 bits of a register after an operation          }        procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);        { returns whether a reference can be used immediately in a powerpc }        { instruction                                                      }        function issimpleref(const ref: treference): boolean;        function save_regs(list : TAsmList):longint;        procedure restore_regs(list : TAsmList);     end;     tcg64fppc = class(tcg64f32)       procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;       procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;       procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;       procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;     end;const  TOpCG2AsmOpConstLo: Array[topcg] of TAsmOp = (A_NONE,A_MR,A_ADDI,A_ANDI_,A_DIVWU,                        A_DIVW,A_MULLW, A_MULLW, A_NONE,A_NONE,A_ORI,                        A_SRAWI,A_SLWI,A_SRWI,A_SUBI,A_XORI,A_NONE,A_NONE);  TOpCG2AsmOpConstHi: Array[topcg] of TAsmOp = (A_NONE,A_MR,A_ADDIS,A_ANDIS_,                        A_DIVWU,A_DIVW, 
A_MULLW,A_MULLW,A_NONE,A_NONE,                        A_ORIS,A_NONE, A_NONE,A_NONE,A_SUBIS,A_XORIS,A_NONE,A_NONE);  implementation    uses       globals,verbose,systems,cutils,       symconst,symsym,fmodule,       rgobj,tgobj,cpupi,procinfo,paramgr;    procedure tcgppc.init_register_allocators;      begin        inherited init_register_allocators;        if target_info.system=system_powerpc_darwin then          begin{            if pi_needs_got in current_procinfo.flags then              begin                current_procinfo.got:=NR_R31;                rg[R_INTREGISTER]:=trgcpu.create(R_INTREGISTER,R_SUBWHOLE,                  [RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,                   RS_R9,RS_R10,RS_R11,RS_R12,RS_R30,RS_R29,                   RS_R28,RS_R27,RS_R26,RS_R25,RS_R24,RS_R23,RS_R22,                   RS_R21,RS_R20,RS_R19,RS_R18,RS_R17,RS_R16,RS_R15,                   RS_R14,RS_R13],first_int_imreg,[]);              end            else}              rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,                [{$ifdef user0} RS_R0,{$endif} RS_R2,RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,                 RS_R9,RS_R10,RS_R11,RS_R12,RS_R31,RS_R30,RS_R29,                 RS_R28,RS_R27,RS_R26,RS_R25,RS_R24,RS_R23,RS_R22,                 RS_R21,RS_R20,RS_R19,RS_R18,RS_R17,RS_R16,RS_R15,                 RS_R14,RS_R13],first_int_imreg,[]);          end        else          rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,            [{$ifdef user0} RS_R0,{$endif}RS_R3,RS_R4,RS_R5,RS_R6,RS_R7,RS_R8,             RS_R9,RS_R10,RS_R11,RS_R12,RS_R31,RS_R30,RS_R29,             RS_R28,RS_R27,RS_R26,RS_R25,RS_R24,RS_R23,RS_R22,             RS_R21,RS_R20,RS_R19,RS_R18,RS_R17,RS_R16,RS_R15,             RS_R14,RS_R13],first_int_imreg,[]);        rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,            [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7,RS_F8,RS_F9,             RS_F10,RS_F11,RS_F12,RS_F13,RS_F31,RS_F30,RS_F29,RS_F28,RS_F27,    
         RS_F26,RS_F25,RS_F24,RS_F23,RS_F22,RS_F21,RS_F20,RS_F19,RS_F18,             RS_F17,RS_F16,RS_F15,RS_F14],first_fpu_imreg,[]);        { TODO: FIX ME}        rg[R_MMREGISTER]:=trgcpu.create(R_MMREGISTER,R_SUBNONE,            [RS_M0,RS_M1,RS_M2],first_mm_imreg,[]);      end;    procedure tcgppc.done_register_allocators;      begin        rg[R_INTREGISTER].free;        rg[R_FPUREGISTER].free;        rg[R_MMREGISTER].free;        inherited done_register_allocators;      end;    procedure tcgppc.a_param_ref(list : TAsmList;size : tcgsize;const r : treference;const paraloc : tcgpara);      var        tmpref, ref: treference;        location: pcgparalocation;        sizeleft: aint;      begin        location := paraloc.location;        tmpref := r;        sizeleft := paraloc.intsize;        while assigned(location) do          begin            case location^.loc of              LOC_REGISTER,LOC_CREGISTER:                begin{$ifndef cpu64bitaddr}                  if (sizeleft <> 3) then                    begin                      a_load_ref_reg(list,location^.size,location^.size,tmpref,location^.register);                    end                  else                    begin                      a_load_ref_reg(list,OS_16,OS_16,tmpref,location^.register);                      a_reg_alloc(list,NR_R0);                      inc(tmpref.offset,2);                      a_load_ref_reg(list,OS_8,OS_8,tmpref,newreg(R_INTREGISTER,RS_R0,R_SUBNONE));                      a_op_const_reg(list,OP_SHL,OS_INT,16,location^.register);                      list.concat(taicpu.op_reg_reg_const_const_const(A_RLWIMI,location^.register,newreg(R_INTREGISTER,RS_R0,R_SUBNONE),8,16,31-8));                      a_reg_dealloc(list,NR_R0);                      dec(tmpref.offset,2);                    end;{$else not cpu64bitaddr}{$error add 64 bit support for non power of 2 loads in a_param_ref}{$endif not cpu64bitaddr}                end;              LOC_REFERENCE:                begin        
           reference_reset_base(ref,location^.reference.index,location^.reference.offset,paraloc.alignment);                   g_concatcopy(list,tmpref,ref,sizeleft);                   if assigned(location^.next) then                     internalerror(2005010710);                end;              LOC_FPUREGISTER,LOC_CFPUREGISTER:                case location^.size of                   OS_F32, OS_F64:                     a_loadfpu_ref_reg(list,location^.size,location^.size,tmpref,location^.register);                   else                     internalerror(2002072801);                end;              LOC_VOID:                begin                  // nothing to do                end;              else                internalerror(2002081103);            end;            inc(tmpref.offset,tcgsize2size[location^.size]);            dec(sizeleft,tcgsize2size[location^.size]);            location := location^.next;          end;      end;    { calling a procedure by name }    procedure tcgppc.a_call_name(list : TAsmList;const s : string; weak: boolean);      begin         { MacOS: The linker on MacOS (PPCLink) inserts a call to glue code,           if it is a cross-TOC call. 
If so, it also replaces the NOP           with some restore code.}         if (target_info.system <> system_powerpc_darwin) then           begin             if not(weak) then               list.concat(taicpu.op_sym(A_BL,current_asmdata.RefAsmSymbol(s)))             else               list.concat(taicpu.op_sym(A_BL,current_asmdata.WeakRefAsmSymbol(s)));             if target_info.system=system_powerpc_macos then               list.concat(taicpu.op_none(A_NOP));           end         else           list.concat(taicpu.op_sym(A_BL,get_darwin_call_stub(s,weak)));{       the compiler does not properly set this flag anymore in pass 1, and       for now we only need it after pass 2 (I hope) (JM)         if not(pi_do_call in current_procinfo.flags) then           internalerror(2003060703);}       include(current_procinfo.flags,pi_do_call);      end;    { calling a procedure by address }    procedure tcgppc.a_call_reg(list : TAsmList;reg: tregister);      var        tmpreg : tregister;        tmpref : treference;      begin        if target_info.system=system_powerpc_macos then          begin            {Generate instruction to load the procedure address from            the transition vector.}            //TODO: Support cross-TOC calls.            
tmpreg := rg[R_INTREGISTER].getregister(list,R_SUBWHOLE);            reference_reset(tmpref,4);            tmpref.offset := 0;            //tmpref.symaddr := refs_full;            tmpref.base:= reg;            list.concat(taicpu.op_reg_ref(A_LWZ,tmpreg,tmpref));          end        else          tmpreg:=reg;        inherited a_call_reg(list,tmpreg);      end;{********************** load instructions ********************}     procedure tcgppc.a_load_const_reg(list : TAsmList; size: TCGSize; a : aint; reg : TRegister);       begin          if not(size in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then            internalerror(2002090902);          if (a >= low(smallint)) and             (a <= high(smallint)) then            list.concat(taicpu.op_reg_const(A_LI,reg,smallint(a)))          else if ((a and $ffff) <> 0) then            begin              list.concat(taicpu.op_reg_const(A_LI,reg,smallint(a and $ffff)));              if ((a shr 16) <> 0) or                 (smallint(a and $ffff) < 0) then                list.concat(taicpu.op_reg_reg_const(A_ADDIS,reg,reg,                  smallint((a shr 16)+ord(smallint(a and $ffff) < 0))))            end          else            list.concat(taicpu.op_reg_const(A_LIS,reg,smallint(a shr 16)));       end;     procedure tcgppc.a_load_ref_reg(list : TAsmList; fromsize,tosize : tcgsize;const ref: treference;reg : tregister);       const         LoadInstr: Array[OS_8..OS_S32,boolean, boolean] of TAsmOp =                                { indexed? 
updating?}                    (((A_LBZ,A_LBZU),(A_LBZX,A_LBZUX)),                     ((A_LHZ,A_LHZU),(A_LHZX,A_LHZUX)),                     ((A_LWZ,A_LWZU),(A_LWZX,A_LWZUX)),                     { 64bit stuff should be handled separately }                     ((A_NONE,A_NONE),(A_NONE,A_NONE)),                     { 128bit stuff too }                     ((A_NONE,A_NONE),(A_NONE,A_NONE)),                     { there's no load-byte-with-sign-extend :( }                     ((A_LBZ,A_LBZU),(A_LBZX,A_LBZUX)),                     ((A_LHA,A_LHAU),(A_LHAX,A_LHAUX)),                     ((A_LWZ,A_LWZU),(A_LWZX,A_LWZUX)));       var         op: tasmop;         ref2: treference;       begin          { TODO: optimize/take into consideration fromsize/tosize. Will }          { probably only matter for OS_S8 loads though                  }          if not(fromsize in [OS_8,OS_S8,OS_16,OS_S16,OS_32,OS_S32]) then            internalerror(2002090902);          ref2 := ref;          fixref(list,ref2);          { the caller is expected to have adjusted the reference already }          { in this case                                                  }          if (TCGSize2Size[fromsize] >= TCGSize2Size[tosize]) then            fromsize := tosize;          op := loadinstr[fromsize,ref2.index<>NR_NO,false];          a_load_store(list,op,reg,ref2);          { sign extend shortint if necessary (because there is	   no load instruction to sign extend an 8 bit value automatically)	   and mask out extra sign bits when loading from a smaller signed	   to a larger unsigned type }          if fromsize = OS_S8 then	    begin	      a_load_reg_reg(list, OS_8, OS_S8, reg, reg);	      a_load_reg_reg(list, OS_S8, tosize, reg, reg);	    end;       end;     procedure tcgppc.a_load_reg_reg(list : TAsmList;fromsize, tosize : tcgsize;reg1,reg2 : tregister);       var         instr: taicpu;       begin         if (tcgsize2size[fromsize] > tcgsize2size[tosize]) or            ((tcgsize2size[fromsize] = 
tcgsize2size[tosize]) and             (fromsize <> tosize)) or            { needs to mask out the sign in the top 16 bits }            ((fromsize = OS_S8) and             (tosize = OS_16)) then           case tosize of             OS_8:               instr := taicpu.op_reg_reg_const_const_const(A_RLWINM,                 reg2,reg1,0,31-8+1,31);             OS_S8:               instr := taicpu.op_reg_reg(A_EXTSB,reg2,reg1);             OS_16:               instr := taicpu.op_reg_reg_const_const_const(A_RLWINM,                 reg2,reg1,0,31-16+1,31);             OS_S16:               instr := taicpu.op_reg_reg(A_EXTSH,reg2,reg1);             OS_32,OS_S32:               instr := taicpu.op_reg_reg(A_MR,reg2,reg1);             else internalerror(2002090901);           end         else           instr := taicpu.op_reg_reg(A_MR,reg2,reg1);         list.concat(instr);         rg[R_INTREGISTER].add_move_instruction(instr);       end;     procedure tcgppc.a_load_subsetreg_reg(list : TAsmList; subsetsize, tosize: tcgsize; const sreg: tsubsetregister; destreg: tregister);       begin         if (sreg.bitlen > 32) then           internalerror(2008020701);         if (sreg.bitlen <> 32) then           begin             list.concat(taicpu.op_reg_reg_const_const_const(A_RLWINM,destreg,               sreg.subsetreg,(32-sreg.startbit) and 31,32-sreg.bitlen,31));             { types with a negative lower bound are always a base type (8, 16, 32 bits) }             if (subsetsize in [OS_S8..OS_S128]) then               if ((sreg.bitlen mod 8) = 0) then                 begin                   a_load_reg_reg(list,tcgsize2unsigned[subsetsize],subsetsize,destreg,destreg);                   a_load_reg_reg(list,subsetsize,tosize,destreg,destreg);                 end               else                 begin                   a_op_const_reg(list,OP_SHL,OS_INT,32-sreg.bitlen,destreg);                   a_op_const_reg(list,OP_SAR,OS_INT,32-sreg.bitlen,destreg);                 end;           end 
        else           a_load_reg_reg(list,subsetsize,tosize,sreg.subsetreg,destreg);       end;     procedure tcgppc.a_load_regconst_subsetreg_intern(list : TAsmList; fromsize, subsetsize: tcgsize; fromreg: tregister; const sreg: tsubsetregister; slopt: tsubsetloadopt);       begin         if (slopt in [SL_SETZERO,SL_SETMAX]) then           inherited a_load_regconst_subsetreg_intern(list,fromsize,subsetsize,fromreg,sreg,slopt)         else if (sreg.bitlen>32) then           internalerror(2008020702)         else if (sreg.bitlen <> 32) then           list.concat(taicpu.op_reg_reg_const_const_const(A_RLWIMI,sreg.subsetreg,fromreg,             sreg.startbit,32-sreg.startbit-sreg.bitlen,31-sreg.startbit))         else           a_load_reg_reg(list,fromsize,subsetsize,fromreg,sreg.subsetreg);       end;       procedure tcgppc.a_load_subsetreg_subsetreg(list: TAsmlist; fromsubsetsize, tosubsetsize: tcgsize; const fromsreg, tosreg: tsubsetregister);         begin           if (tosreg.bitlen>32) or (tosreg.startbit>31) then             internalerror(2008020703);           if (fromsreg.bitlen >= tosreg.bitlen) then             list.concat(taicpu.op_reg_reg_const_const_const(A_RLWIMI,tosreg.subsetreg, fromsreg.subsetreg,                (tosreg.startbit-fromsreg.startbit) and 31,                32-tosreg.startbit-tosreg.bitlen,31-tosreg.startbit))           else             inherited a_load_subsetreg_subsetreg(list,fromsubsetsize,tosubsetsize,fromsreg,tosreg);         end;     procedure tcgppc.a_op_const_reg(list : TAsmList; Op: TOpCG; size: TCGSize; a: aint; reg: TRegister);       begin         a_op_const_reg_reg(list,op,size,a,reg,reg);       end;      procedure tcgppc.a_op_reg_reg(list : TAsmList; Op: TOpCG; size: TCGSize; src, dst: TRegister);         begin           a_op_reg_reg_reg(list,op,size,src,dst,dst);         end;    procedure tcgppc.maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);      const        overflowops = 
[OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NOT,OP_NEG];      begin        if (op in overflowops) and           (size in [OS_8,OS_S8,OS_16,OS_S16]) then          a_load_reg_reg(list,OS_32,size,dst,dst);      end;    procedure tcgppc.a_op_const_reg_reg(list: TAsmList; op: TOpCg;                       size: tcgsize; a: aint; src, dst: tregister);      var        l1,l2: longint;        oplo, ophi: tasmop;        scratchreg: tregister;        useReg, gotrlwi: boolean;        procedure do_lo_hi;          begin            list.concat(taicpu.op_reg_reg_const(oplo,dst,src,word(a)));            list.concat(taicpu.op_reg_reg_const(ophi,dst,dst,word(a shr 16)));          end;      begin        if (op = OP_MOVE) then          internalerror(2006031401);        if op = OP_SUB then          begin            a_op_const_reg_reg(list,OP_ADD,size,-a,src,dst);            exit;          end;        ophi := TOpCG2AsmOpConstHi[op];        oplo := TOpCG2AsmOpConstLo[op];        gotrlwi := get_rlwi_const(a,l1,l2);        if (op in [OP_AND,OP_OR,OP_XOR]) then          begin            if (a = 0) then              begin                if op = OP_AND then                  list.concat(taicpu.op_reg_const(A_LI,dst,0))                else                  a_load_reg_reg(list,size,size,src,dst);                exit;              end            else if (a = -1) then              begin                case op of                  OP_OR:                    list.concat(taicpu.op_reg_const(A_LI,dst,-1));                  OP_XOR:                    list.concat(taicpu.op_reg_reg(A_NOT,dst,src));                  OP_AND:                    a_load_reg_reg(list,size,size,src,dst);                end;                exit;              end            else if (aword(a) <= high(word)) and               ((op <> OP_AND) or                not gotrlwi) then              begin                if ((size = OS_8) and                    (byte(a) <> a)) or                   ((size = OS_S8) and                    (shortint(a) <> a)) 
then                  internalerror(200604142);                list.concat(taicpu.op_reg_reg_const(oplo,dst,src,word(a)));                { and/or/xor -> cannot overflow in high 16 bits }                exit;              end;            { all basic constant instructions also have a shifted form that }            { works only on the highest 16bits, so if lo(a) is 0, we can    }            { use that one                                                  }            if (word(a) = 0) and               (not(op = OP_AND) or                not gotrlwi) then              begin                if (size in [OS_8,OS_S8,OS_16,OS_S16]) then                  internalerror(200604141);                list.concat(taicpu.op_reg_reg_const(ophi,dst,src,word(a shr 16)));                exit;              end;          end        else if (op = OP_ADD) then          if a = 0 then            begin              a_load_reg_reg(list,size,size,src,dst);              exit            end          else if (a >= low(smallint)) and                  (a <= high(smallint)) then             begin               list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,src,smallint(a)));               maybeadjustresult(list,op,size,dst);               exit;             end;        { otherwise, the instructions we can generate depend on the }        { operation                                                 }        useReg := false;        case op of          OP_DIV,OP_IDIV:             if (a = 0) then               internalerror(200208103)             else if (a = 1) then               begin                 a_load_reg_reg(list,OS_INT,OS_INT,src,dst);                 exit               end            else if ispowerof2(a,l1) then              begin                case op of                  OP_DIV:                    list.concat(taicpu.op_reg_reg_const(A_SRWI,dst,src,l1));                  OP_IDIV:                    begin                       list.concat(taicpu.op_reg_reg_const(A_SRAWI,dst,src,l1));              
         list.concat(taicpu.op_reg_reg(A_ADDZE,dst,dst));                    end;                end;                exit;              end            else              usereg := true;           OP_IMUL, OP_MUL:             if (a = 0) then               begin                 list.concat(taicpu.op_reg_const(A_LI,dst,0));                 exit               end             else if (a = 1) then               begin                 a_load_reg_reg(list,OS_INT,OS_INT,src,dst);                 exit               end             else if ispowerof2(a,l1) then               list.concat(taicpu.op_reg_reg_const(A_SLWI,dst,src,l1))             else if (longint(a) >= low(smallint)) and                (longint(a) <= high(smallint)) then               list.concat(taicpu.op_reg_reg_const(A_MULLI,dst,src,smallint(a)))             else               usereg := true;          OP_ADD:            begin              list.concat(taicpu.op_reg_reg_const(oplo,dst,src,smallint(a)));              list.concat(taicpu.op_reg_reg_const(ophi,dst,dst,                smallint((a shr 16) + ord(smallint(a) < 0))));            end;          OP_OR:            { try to use rlwimi }            if gotrlwi and               (src = dst) then              begin                scratchreg := rg[R_INTREGISTER].getregister(list,R_SUBWHOLE);                list.concat(taicpu.op_reg_const(A_LI,scratchreg,-1));                list.concat(taicpu.op_reg_reg_const_const_const(A_RLWIMI,dst,                  scratchreg,0,l1,l2));              end            else              do_lo_hi;          OP_AND:            { try to use rlwinm }            if gotrlwi then              list.concat(taicpu.op_reg_reg_const_const_const(A_RLWINM,dst,                src,0,l1,l2))            else              useReg := true;          OP_XOR:            do_lo_hi;          OP_SHL,OP_SHR,OP_SAR:            begin              if (a and 31) <> 0 Then                list.concat(taicpu.op_reg_reg_const(                  
TOpCG2AsmOpConstLo[Op],dst,src,a and 31))
              else
                a_load_reg_reg(list,size,size,src,dst);
              if (a shr 5) <> 0 then
                internalError(68991);
            end;
          OP_ROL:
            begin
              if (not (size in [OS_32, OS_S32])) then begin
                internalerror(2008091307);
              end;
              list.concat(taicpu.op_reg_reg_const_const_const(A_RLWINM, dst, src, a and 31, 0, 31));
            end;
          OP_ROR:
            begin
              if (not (size in [OS_32, OS_S32])) then begin
                internalerror(2008091308);
              end;
              list.concat(taicpu.op_reg_reg_const_const_const(A_RLWINM, dst, src, (32 - a) and 31, 0, 31));
            end
          else
            internalerror(200109091);
        end;
        { if all else failed, load the constant in a register and then }
        { perform the operation                                        }
        if useReg then
          begin
            scratchreg := rg[R_INTREGISTER].getregister(list,R_SUBWHOLE);
            a_load_const_reg(list,OS_32,a,scratchreg);
            a_op_reg_reg_reg(list,op,OS_32,scratchreg,src,dst);
          end;
        maybeadjustresult(list,op,size,dst);
      end;


    procedure tcgppc.a_op_reg_reg_reg(list: TAsmList; op: TOpCg;
      size: tcgsize; src1, src2, dst: tregister);
      { Appends to list the register/register form of the generic operation }
      { op.                                                                 }
      {   - OP_MOVE is rejected with an internalerror.                      }
      {   - OP_NEG/OP_NOT are unary: only src1 is read. After an OP_NOT on  }
      {     a size other than OS_32/OS_S32 the result is extended again via }
      {     a_load_reg_reg(OS_32 -> size).                                  }
      {   - OP_ROL/OP_ROR are only accepted for OS_32/OS_S32 (internalerror }
      {     otherwise) and are emitted as RLWNM with mask 0..31. For OP_ROR }
      {     the count in src1 is first negated into a temporary register.   }
      {   - every other operation is looked up in op_reg_reg_opcg2asmop and }
      {     emitted with the operands in the order (dst, src2, src1).       }
      { maybeadjustresult is called on dst at the end in all cases.         }
      const
        { one entry per TOpCG value, in declaration order of TOpCG }
        op_reg_reg_opcg2asmop: array[TOpCG] of tasmop =
          (A_NONE,A_MR,A_ADD,A_AND,A_DIVWU,A_DIVW,A_MULLW,A_MULLW,A_NEG,A_NOT,A_OR,
           A_SRAW,A_SLW,A_SRW,A_SUB,A_XOR,A_NONE,A_NONE);
      var
        tmpreg : TRegister;
      begin
        if (op = OP_MOVE) then
          internalerror(2006031402);
        case op of
          OP_NEG,OP_NOT:
            begin
              list.concat(taicpu.op_reg_reg(op_reg_reg_opcg2asmop[op],dst,src1));
              if (op = OP_NOT) and
                 not(size in [OS_32,OS_S32]) then
                { zero/sign extend result again }
                a_load_reg_reg(list,OS_32,size,dst,dst);
            end;
          OP_ROL:
            begin
              if (not (size in [OS_32, OS_S32])) then begin
                internalerror(2008091305);
              end;
              list.concat(taicpu.op_reg_reg_reg_const_const(A_RLWNM, dst, src2, src1, 0, 31));
            end;
          OP_ROR:
            begin
              if (not (size in [OS_32, OS_S32])) then begin
                internalerror(2008091306);
              end;
              { request the temporary on the list we are emitting into, so }
              { that its allocation information ends up next to the        }
              { instructions using it even when list is not the current    }
              { assembler list                                             }
              tmpreg := getintregister(list, OS_INT);
              { rotate right by n == rotate left by -n }
              list.concat(taicpu.op_reg_reg(A_NEG, tmpreg, src1));
              list.concat(taicpu.op_reg_reg_reg_const_const(A_RLWNM, dst, src2, tmpreg, 0, 31));
            end;
          else
            list.concat(taicpu.op_reg_reg_reg(op_reg_reg_opcg2asmop[op],dst,src2,src1));
        end;
        maybeadjustresult(list,op,size,dst);
      end;


{*************** compare instructions ****************}

      procedure tcgppc.a_cmp_const_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;a : aint;reg : tregister;
        l : tasmlabel);
        { Compares reg against the constant a in CR0 and appends a          }
        { conditional branch to l for cmp_op. The size parameter is not     }
        { looked at. A signed compare is used for OC_GT/LT/GTE/LTE/EQ/NE, an }
        { unsigned one for everything else. Constants that do not fit the   }
        { immediate field of the chosen compare are first loaded into a     }
        { scratch register.                                                 }
        var
          scratch_register: TRegister;
          signed: boolean;
        begin
          signed := cmp_op in [OC_GT,OC_LT,OC_GTE,OC_LTE,OC_EQ,OC_NE];
          { in the following case, we generate more efficient code when }
          { signed is false                                              }
          { ($8000..$ffff does not fit CMPWI, but does fit CMPLWI)       }
          if (cmp_op in [OC_EQ,OC_NE]) and
             (aword(a) >= $8000) and
             (aword(a) <= $ffff) then
            signed := false;
          if signed then
            if (a >= low(smallint)) and (a <= high(smallint)) Then
              list.concat(taicpu.op_reg_reg_const(A_CMPWI,NR_CR0,reg,a))
            else
              begin
                scratch_register := rg[R_INTREGISTER].getregister(list,R_SUBWHOLE);
                a_load_const_reg(list,OS_32,a,scratch_register);
                list.concat(taicpu.op_reg_reg_reg(A_CMPW,NR_CR0,reg,scratch_register));
              end
          else
            if (aword(a) <= $ffff) then
              list.concat(taicpu.op_reg_reg_const(A_CMPLWI,NR_CR0,reg,aword(a)))
            else
              begin
                scratch_register := rg[R_INTREGISTER].getregister(list,R_SUBWHOLE);
                a_load_const_reg(list,OS_32,a,scratch_register);
                list.concat(taicpu.op_reg_reg_reg(A_CMPLW,NR_CR0,reg,scratch_register));
              end;
          a_jmp(list,A_BC,TOpCmp2AsmCond[cmp_op],0,l);
        end;


      procedure tcgppc.a_cmp_reg_reg_label(list : TAsmList;size : tcgsize;cmp_op : topcmp;
        reg1,reg2 : tregister;l : tasmlabel);
        { Compares two registers in CR0 (operand order: reg2, reg1) and     }
        { appends a conditional branch to l. CMPW is used for               }
        { OC_GT/LT/GTE/LTE, CMPLW for all other conditions. The size        }
        { parameter is not looked at.                                       }
        var
          op: tasmop;
        begin
          if cmp_op in [OC_GT,OC_LT,OC_GTE,OC_LTE] then
            op := A_CMPW
          else
            op := A_CMPLW;
          list.concat(taicpu.op_reg_reg_reg(op,NR_CR0,reg2,reg1));
          a_jmp(list,A_BC,TOpCmp2AsmCond[cmp_op],0,l);
        end;


    procedure tcgppc.a_jmp_name(list : TAsmList;const s : string);
      { Appends an unconditional branch (A_B) to the symbol named s. On    }
      { Darwin the branch goes to the stub returned by                      }
      { get_darwin_call_stub(s,false) instead of to the symbol itself.      }
      var
        p : taicpu;
      begin
        if (target_info.system = system_powerpc_darwin) then
          p := taicpu.op_sym(A_B,get_darwin_call_stub(s,false))
        else
          p := taicpu.op_sym(A_B,current_asmdata.RefAsmSymbol(s));
        p.is_jmp := true;
        list.concat(p)
      end;


     procedure tcgppc.a_jmp_always(list : TAsmList;l: tasmlabel);
       { Appends an unconditional branch to label l. }
       begin
         a_jmp(list,A_B,C_None,0,l);
       end;


     procedure tcgppc.a_jmp_flags(list : TAsmList;const f : TResFlags;l: tasmlabel);
       { Appends a conditional branch to l that tests the flags described }
       { by f; the CR field index passed on is c.cr relative to RS_CR0.   }
       var
         c: tasmcond;
       begin
         c := flags_to_cond(f);
         a_jmp(list,A_BC,c.cond,c.cr-RS_CR0,l);
       end;


     procedure tcgppc.g_flags2reg(list: TAsmList; size: TCgSize; const f: TResFlags; reg: TRegister);
       { Materialises the flag described by f as 0 or 1 in reg: the whole  }
       { condition register is copied to reg with MFCR, the wanted bit is  }
       { rotated into the lowest bit position and isolated with RLWINM,    }
       { and the result is inverted with XORI when the flag is one of the  }
       { negated conditions (F_NE, F_GE, F_LE). The size parameter is not  }
       { looked at.                                                        }
       var
         testbit: byte;
         bitvalue: boolean;
       begin
         { get the bit to extract from the conditional register + its }
         { requested value (0 or 1)                                   }
         { each CR field is 4 bits wide: +0 = LT, +1 = GT, +2 = EQ     }
         testbit := ((f.cr-RS_CR0) * 4);
         case f.flag of
           F_EQ,F_NE:
             begin
               inc(testbit,2);
               bitvalue := f.flag = F_EQ;
             end;
           F_LT,F_GE:
             begin
               bitvalue := f.flag = F_LT;
             end;
           F_GT,F_LE:
             begin
               inc(testbit);
               bitvalue := f.flag = F_GT;
             end;
           else
             internalerror(200112261);
         end;
         { load the conditional register in the destination reg }
         list.concat(taicpu.op_reg(A_MFCR,reg));
         { we will move the bit that has to be tested to bit 0 by rotating }
         { left                                                            }
         testbit := (testbit + 1) and 31;
         { extract bit }
         list.concat(taicpu.op_reg_reg_const_const_const(
           A_RLWINM,reg,reg,testbit,31,31));
         { if we need the inverse, xor with 1 }
         if not bitvalue then
           list.concat(taicpu.op_reg_reg_const(A_XORI,reg,reg,1));
       end;


(*
     procedure tcgppc.g_cond2reg(list: TAsmList; const f: TAsmCond; reg: TRegister);
       var
         testbit: byte;
         bitvalue: boolean;
       begin
         { get the bit to extract from the conditional register + its }
         { requested value (0 or 1)                                   }
         case f.simple of
           false:
             begin
               { we don't generate this in the compiler }
               internalerror(200109062);
             end;
           true:
             case f.cond of
               C_None:
                 internalerror(200109063);
               C_LT..C_NU:
                 begin
                   testbit := (ord(f.cr) - ord(R_CR0))*4;
                   inc(testbit,AsmCondFlag2BI[f.cond]);
                   bitvalue := AsmCondFlagTF[f.cond];
                 end;
               C_T,C_F,C_DNZT,C_DNZF,C_DZT,C_DZF:
                 begin
                   testbit := f.crbit
                   bitvalue := AsmCondFlagTF[f.cond];
                 end;
               else
                 internalerror(200109064);
             end;
         end;
         { load the conditional register in the destination reg }
list.concat(taicpu.op_reg_reg(A_MFCR,reg));
         { we will move the bit that has to be tested to bit 31 -> rotate }
         { left by bitpos+1 (remember, this is big-endian!)               }
         if bitpos <> 31 then
           inc(bitpos)
         else
           bitpos := 0;
         { extract bit }
         list.concat(taicpu.op_reg_reg_const_const_const(
           A_RLWINM,reg,reg,bitpos,31,31));
         { if we need the inverse, xor with 1 }
         if not bitvalue then
           list.concat(taicpu.op_reg_reg_const(A_XORI,reg,reg,1));
       end;
*)

{ *********** entry/exit code and address loading ************ }

    procedure tcgppc.g_save_registers(list:TAsmList);
      { Intentionally empty: emits nothing. }
      begin
        { this work is done in g_proc_entry }
      end;


    procedure tcgppc.g_restore_registers(list:TAsmList);
      { Intentionally empty: emits nothing. }
      begin
        { this work is done in g_proc_exit }
      end;


    procedure tcgppc.g_proc_entry(list : TAsmList;localsize : longint;nostackframe:boolean);
     { generates the entry code of a procedure/function. Note: localsize is the }
     { sum of the size necessary for local variables and the maximum possible   }
     { combined size of ALL the parameters of a procedure called by the current }
     { one.                                                                     }
     { This procedure may be called before, as well as after g_return_from_proc }
     { is called. NOTE registers are not to be allocated through the register   }
     { allocator here, because the register colouring has already occurred !!   }
     {                                                                          }
     { Emitted sequence, in order:                                              }
     {   1. (non-assembler routines, if save_lr_in_prologue) LR is copied to r0 }
     {      and stored at the ABI's LR slot relative to the stack pointer       }
     {   2. (non-assembler routines, if a frame pointer is needed) the stack    }
     {      pointer is copied to r12                                            }
     {   3. the callee-saved FPRs, starting at offset -8 from r1 and growing    }
     {      downwards                                                           }
     {   4. the callee-saved GPRs directly below the FPR area, either with one  }
     {      STMW or with individual stores                                      }
     {   5. unless nostackframe is set, no frame is needed or localsize is 0:   }
     {      the stack pointer is decremented by localsize with STWU/STWUX       }
     var regcounter,firstregfpu,firstregint: TSuperRegister;
         href : treference;
         usesfpr,usesgpr : boolean;
      begin
        { CR and LR only have to be saved in case they are modified by the current }
        { procedure, but currently this isn't checked, so save them always         }
        { following is the entry code as described in "Altivec Programming }
        { Interface Manual", bar the saving of AltiVec registers           }
        a_reg_alloc(list,NR_STACK_POINTER_REG);
        usesgpr := false;
        usesfpr := false;
        { pure assembler routines get no LR/register saving at all }
        if not(po_assembler in current_procinfo.procdef.procoptions) then
          begin
            { save link register? }
            if save_lr_in_prologue then
              begin
                a_reg_alloc(list,NR_R0);
                { save return address... }
                { warning: if this is no longer done via r0, or if r0 is       }
                { added to the usable registers, adapt tcgppcgen.g_profilecode }
                list.concat(taicpu.op_reg(A_MFLR,NR_R0));
                { ... in caller's frame }
                { NOTE(review): there is no else branch, so href is left }
                { untouched for any other ABI value                      }
                case target_info.abi of
                  abi_powerpc_aix:
                    reference_reset_base(href,NR_STACK_POINTER_REG,LA_LR_AIX,4);
                  abi_powerpc_sysv:
                    reference_reset_base(href,NR_STACK_POINTER_REG,LA_LR_SYSV,4);
                end;
                list.concat(taicpu.op_reg_ref(A_STW,NR_R0,href));
                { when profiling is enabled r0 is deliberately left allocated }
                { (see the g_profilecode warning above)                       }
                if not(cs_profile in current_settings.moduleswitches) then
                  a_reg_dealloc(list,NR_R0);
              end;

(*
            { save the CR if necessary in callers frame. }
            if target_info.abi = abi_powerpc_aix then
              if false then { Not needed at the moment. }
                begin
                  a_reg_alloc(list,NR_R0);
                  list.concat(taicpu.op_reg_reg(A_MFSPR,NR_R0,NR_CR));
                  reference_reset_base(href,NR_STACK_POINTER_REG,LA_CR_AIX);
                  list.concat(taicpu.op_reg_ref(A_STW,NR_R0,href));
                  a_reg_dealloc(list,NR_R0);
                end;
*)

            { a value of 32 means that no register of that class has to be saved }
            firstregfpu := tppcprocinfo(current_procinfo).get_first_save_fpu_reg;
            firstregint := tppcprocinfo(current_procinfo).get_first_save_int_reg;
            usesgpr := firstregint <> 32;
            usesfpr := firstregfpu <> 32;

            { keep a copy of the incoming stack pointer in r12 }
            if (tppcprocinfo(current_procinfo).needs_frame_pointer) then
              begin
                a_reg_alloc(list,NR_R12);
                list.concat(taicpu.op_reg_reg(A_MR,NR_R12,NR_STACK_POINTER_REG));
              end;
          end;

        if usesfpr then
          begin
             { FPRs are stored at r1-8, r1-16, ... in ascending register order }
             reference_reset_base(href,NR_R1,-8,8);
             for regcounter:=firstregfpu to RS_F31 do
               begin
                 a_loadfpu_reg_ref(list,OS_F64,OS_F64,newreg(R_FPUREGISTER,regcounter,R_SUBNONE),href);
                 dec(href.offset,8);
               end;
             { compute start of gpr save area }
             { (the loop left offset 8 below the last FPR slot; the first }
             {  4 byte GPR slot is 4 below it)                            }
             inc(href.offset,4);
          end
        else
          { compute start of gpr save area }
          reference_reset_base(href,NR_R1,-4,4);

        { save gprs and fetch GOT pointer }
        if usesgpr then
          begin
            if (firstregint <= RS_R22) or
               ((cs_opt_size in current_settings.optimizerswitches) and
               { with RS_R30 it's also already smaller, but too big a speed trade-off to make }
                (firstregint <= RS_R29)) then
              begin
                { TODO: TODO: 64 bit support }
                { move href down to the lowest slot of the area and store }
                { the whole register range with a single instruction      }
                dec(href.offset,(RS_R31-firstregint)*sizeof(pint));
                list.concat(taicpu.op_reg_ref(A_STMW,newreg(R_INTREGISTER,firstregint,R_SUBNONE),href));
              end
            else
              { few registers: one store per register, walking downwards }
              for regcounter:=firstregint to RS_R31 do
                begin
                  a_load_reg_ref(list,OS_INT,OS_INT,newreg(R_INTREGISTER,regcounter,R_SUBNONE),href);
                  dec(href.offset,4);
                end;
          end;

{        done in ncgutil because it may only be released after the parameters }
{        have been moved to their final resting place                         }
{        if (tppcprocinfo(current_procinfo).needs_frame_pointer) then }
{          a_reg_dealloc(list,NR_R12); }

        { allocate the stack frame itself }
        if (not nostackframe) and
           tppcprocinfo(current_procinfo).needstackframe and
           (localsize <> 0) then
          begin
            if (localsize <= high(smallint)) then
              begin
                { displacement fits the 16 bit field: store-with-update }
                reference_reset_base(href,NR_STACK_POINTER_REG,-localsize,8);
                a_load_store(list,A_STWU,NR_STACK_POINTER_REG,href);
              end
            else
              begin
                reference_reset_base(href,NR_STACK_POINTER_REG,0,4);
                { can't use getregisterint here, the register colouring }
                { is already done when we get here                      }
                { R12 may hold previous stack pointer, R11  may be in   }
                { use as got => use R0 (but then we can't use           }
                { a_load_const_reg)                                     }
                href.index := NR_R0;
                a_reg_alloc(list,href.index);
                { build the 32 bit value -localsize in r0 by hand: LI loads }
                { the (sign extended) low half, XORIS/ORIS fixes up the     }
                { high half                                                 }
                list.concat(taicpu.op_reg_const(A_LI,NR_R0,smallint((-localsize) and $ffff)));
                if (smallint((-localsize) and $ffff) < 0) then
                  { upper 16 bits are now $ffff -> xor with inverse }
                  list.concat(taicpu.op_reg_reg_const(A_XORIS,NR_R0,NR_R0,word(not(((-localsize) shr 16) and $ffff))))
                else
                  list.concat(taicpu.op_reg_reg_const(A_ORIS,NR_R0,NR_R0,word(((-localsize) shr 16) and $ffff)));
                a_load_store(list,A_STWUX,NR_STACK_POINTER_REG,href);
                a_reg_dealloc(list,href.index);
              end;
          end;

        { save the CR if necessary ( !!! never done currently ) }
{       still need to find out where this has to be done for SystemV
        a_reg_alloc(list,R_0);
        list.concat(taicpu.op_reg_reg(A_MFSPR,R_0,R_CR);
        list.concat(taicpu.op_reg_ref(A_STW,scratch_register,
          new_reference(STACK_POINTER_REG,LA_CR)));
        a_reg_dealloc(list,R_0);
}
        { now comes the AltiVec context save, not yet implemented !!! }
      end;


    procedure tcgppc.g_proc_exit(list : TAsmList;parasize : longint;nostackframe:boolean);
     { This procedure may be called before, as well as after g_stackframe_entry }
     { is called. NOTE registers are not to be allocated through the register   }
     { allocator here, because the register colouring has already occurred !!   }
      var
         regcounter,firstregfpu,firstregint: TsuperRegister;
         href : treference;
         usesfpr,usesgpr,genret : boolean;
         localsize: aint;
      begin
        { AltiVec context restore, not yet implemented !!!
}
        usesfpr:=false;
        usesgpr:=false;
        if not (po_assembler in current_procinfo.procdef.procoptions) then
          begin
            { a value of 32 means that no register of that class was saved }
            firstregfpu := tppcprocinfo(current_procinfo).get_first_save_fpu_reg;
            firstregint := tppcprocinfo(current_procinfo).get_first_save_int_reg;
            usesgpr := firstregint <> 32;
            usesfpr := firstregfpu <> 32;
          end;

        localsize:= tppcprocinfo(current_procinfo).calc_stackframe_size;

        { adjust r1 }
        { (register allocator is no longer valid at this time and an add of 0   }
        { is translated into a move, which is then registered with the register }
        { allocator, causing a crash                                            }
        if (not nostackframe) and
           tppcprocinfo(current_procinfo).needstackframe and
           (localsize <> 0) then
          a_op_const_reg(list,OP_ADD,OS_ADDR,localsize,NR_R1);

        { no return (blr) generated yet }
        genret:=true;
        { reload the callee-saved FPRs from r1-8, r1-16, ... }
        if usesfpr then
          begin
            reference_reset_base(href,NR_R1,-8,8);
            for regcounter := firstregfpu to RS_F31 do
              begin
                a_loadfpu_ref_reg(list,OS_F64,OS_F64,href,newreg(R_FPUREGISTER,regcounter,R_SUBNONE));
                dec(href.offset,8);
              end;
            { start of the gpr save area, directly below the fprs }
            inc(href.offset,4);
          end
        else
          reference_reset_base(href,NR_R1,-4,4);

        { reload the callee-saved GPRs }
        if (usesgpr) then
          begin
            if (firstregint <= RS_R22) or
               ((cs_opt_size in current_settings.optimizerswitches) and
                { with RS_R30 it's also already smaller, but too big a speed trade-off to make }
                (firstregint <= RS_R29)) then
              begin
                { TODO: TODO: 64 bit support }
                dec(href.offset,(RS_R31-firstregint)*sizeof(pint));
                list.concat(taicpu.op_reg_ref(A_LMW,newreg(R_INTREGISTER,firstregint,R_SUBNONE),href));
              end
            else
              for regcounter:=firstregint to RS_R31 do
                begin
                  a_load_ref_reg(list,OS_INT,OS_INT,href,newreg(R_INTREGISTER,regcounter,R_SUBNONE));
                  dec(href.offset,4);
                end;
          end;

(*
        { restore fprs and return }
        if usesfpr then
          begin
             { address of fpr save area to r11 }
             r:=NR_R12;
             list.concat(taicpu.op_reg_reg_const(A_ADDI,r,r,(ord(R_F31)-ord(firstregfpu.enum)+1)*8));
             {
             if (pi_do_call in current_procinfo.flags) then
               a_call_name(current_asmdata.RefAsmSymbol('_restfpr_'+tostr(ord(firstregfpu)-ord(R_F14)+14)+'_x'))
             else
               { leaf node => lr haven't to be restored }
               a_call_name('_restfpr_'+tostr(ord(firstregfpu.enum)-ord(R_F14)+14)+'_l');
             genret:=false;
             }
          end;
*)

        { if we didn't generate the return code, we've to do it now }
        if genret then
          begin
            { load link register? }
            if not (po_assembler in current_procinfo.procdef.procoptions) then
              begin
                if (pi_do_call in current_procinfo.flags) then
                  begin
                    case target_info.abi of
                      abi_powerpc_aix:
                        reference_reset_base(href,NR_STACK_POINTER_REG,LA_LR_AIX,4);
                      abi_powerpc_sysv:
                        reference_reset_base(href,NR_STACK_POINTER_REG,LA_LR_SYSV,4);
                    end;
                    a_reg_alloc(list,NR_R0);
                    list.concat(taicpu.op_reg_ref(A_LWZ,NR_R0,href));
                    list.concat(taicpu.op_reg(A_MTLR,NR_R0));
                    a_reg_dealloc(list,NR_R0);
                  end;

(*
                  { restore the CR if necessary from callers frame}
                  if target_info.abi = abi_powerpc_aix then
                    if false then { Not needed at the moment. }
                      begin
                        reference_reset_base(href,NR_STACK_POINTER_REG,LA_CR_AIX);
                        list.concat(taicpu.op_reg_ref(A_LWZ,NR_R0,href));
                        list.concat(taicpu.op_reg_reg(A_MTSPR,NR_R0,NR_CR));
                        a_reg_dealloc(list,NR_R0);
                      end;
*)
              end;

            list.concat(taicpu.op_none(A_BLR));
          end;
      end;


    function tcgppc.save_regs(list : TAsmList):longint;
    { Generates code which saves the used non-volatile registers in the   }
    { save area right below the address the stack pointer points to.      }
    { Returns the size in bytes of the save area actually used.           }
    {                                                                     }
    { Layout: the FPRs from the first used callee-saved one up to f31 are }
    { stored at SP-8, SP-16, ...; the GPRs from the first used one (r13   }
    { or higher) up to r31 follow directly below. Nothing is saved for    }
    { pure assembler routines.                                            }
     var regcounter,firstregfpu,firstreggpr: TSuperRegister;
         usesfpr,usesgpr: boolean;
         href : treference;
         offset: aint;
         regcounter2, firstfpureg: Tsuperregister;
    begin
      { find the lowest numbered callee-saved FPR used by this routine }
      usesfpr:=false;
      if not (po_assembler in current_procinfo.procdef.procoptions) then
        begin
            { FIXME: has to be R_F14 instead of R_F8 for SYSV-64bit }
            case target_info.abi of
              abi_powerpc_aix:
                firstfpureg := RS_F14;
              abi_powerpc_sysv:
                firstfpureg := RS_F9;
              else
                internalerror(2003122903);
            end;
          for regcounter:=firstfpureg to RS_F31 do
           begin
             if regcounter in rg[R_FPUREGISTER].used_in_proc then
              begin
                 usesfpr:=true;
                 firstregfpu:=regcounter;
                 break;
              end;
           end;
        end;

      { find the lowest numbered callee-saved GPR used by this routine }
      usesgpr:=false;
      if not (po_assembler in current_procinfo.procdef.procoptions) then
        for regcounter2:=RS_R13 to RS_R31 do
          begin
            if regcounter2 in rg[R_INTREGISTER].used_in_proc then
              begin
                 usesgpr:=true;
                 firstreggpr:=regcounter2;
                 break;
              end;
          end;
      offset:= 0;

      { save floating-point registers }
      if usesfpr then
        for regcounter := firstregfpu to RS_F31 do
          begin
            offset:= offset - 8;
            reference_reset_base(href, NR_STACK_POINTER_REG, offset, 8);
            { build a real FPU register from the super register number; a  }
            { plain typecast would lose the register type and subregister  }
            list.concat(taicpu.op_reg_ref(A_STFD, newreg(R_FPUREGISTER,regcounter,R_SUBWHOLE), href));
          end;
        (* Optimization in the future:  a_call_name(list,'_savefXX'); *)

      { save gprs in gpr save area }
      if usesgpr then
        if firstreggpr < RS_R30 then
          begin
            offset:= offset - 4 * (RS_R31 - firstreggpr + 1);
            reference_reset_base(href,NR_STACK_POINTER_REG,offset,4);
            { STMW stores multiple registers; as above, the operand has to }
            { be a complete integer register, not a bare number            }
            list.concat(taicpu.op_reg_ref(A_STMW,newreg(R_INTREGISTER,firstreggpr,R_SUBWHOLE),href));
          end
        else
          begin
            for regcounter := firstreggpr to RS_R31 do
              begin
                offset:= offset - 4;
                reference_reset_base(href, NR_STACK_POINTER_REG, offset, 4);
                list.concat(taicpu.op_reg_ref(A_STW, newreg(R_INTREGISTER,regcounter,R_SUBWHOLE), href));
              end;
          end;

      { now comes the AltiVec context save, not yet implemented !!! }

      { offset is <= 0 here; its magnitude is the number of bytes used }
      save_regs:= -offset;
    end;


    procedure tcgppc.restore_regs(list : TAsmList);
    { Generates code which restores the used non-volatile registers from  }
    { the save area right below the address the stack pointer points to.  }
    { Mirrors save_regs: the same registers are located with the same     }
    { scan and reloaded from the same offsets.                            }
     var regcounter,firstregfpu,firstreggpr: TSuperRegister;
         usesfpr,usesgpr: boolean;
         href : treference;
         offset: integer;
         regcounter2, firstfpureg: Tsuperregister;
    begin
      { find the lowest numbered callee-saved FPR used by this routine }
      usesfpr:=false;
      if not (po_assembler in current_procinfo.procdef.procoptions) then
        begin
          { FIXME: has to be R_F14 instead of R_F8 for SYSV-64bit }
          case target_info.abi of
            abi_powerpc_aix:
              firstfpureg := RS_F14;
            abi_powerpc_sysv:
              firstfpureg := RS_F9;
            else
              internalerror(2003122903);
          end;
          for regcounter:=firstfpureg to RS_F31 do
           begin
             if regcounter in rg[R_FPUREGISTER].used_in_proc then
              begin
                 usesfpr:=true;
                 firstregfpu:=regcounter;
                 break;
              end;
           end;
        end;

      { find the lowest numbered callee-saved GPR used by this routine }
      usesgpr:=false;
      if not (po_assembler in current_procinfo.procdef.procoptions) then
        for regcounter2:=RS_R13 to RS_R31 do
          begin
            if regcounter2 in rg[R_INTREGISTER].used_in_proc then
              begin
                 usesgpr:=true;
                 firstreggpr:=regcounter2;
                 break;
              end;
          end;

      offset:= 0;

      { restore fp registers }
      if usesfpr then
        for regcounter := firstregfpu to RS_F31 do
          begin
            offset:= offset - 8;
            reference_reset_base(href, NR_STACK_POINTER_REG, offset, 8);
            list.concat(taicpu.op_reg_ref(A_LFD, newreg(R_FPUREGISTER,regcounter,R_SUBWHOLE), href));
          end;
        (* Optimization in the future: a_call_name(list,'_restfXX'); *)

      { restore gprs }
      if usesgpr then
        if firstreggpr < RS_R30 then
          begin
            offset:= offset - 4 * (RS_R31 - firstreggpr + 1);
            reference_reset_base(href,NR_STACK_POINTER_REG,offset, 4); { -220 }
            { LMW loads multiple registers; the operand has to be a   }
            { complete integer register, not a bare super register    }
            { number cast to tregister                                }
            list.concat(taicpu.op_reg_ref(A_LMW,newreg(R_INTREGISTER,firstreggpr,R_SUBWHOLE),href));
          end
        else
          begin
            for regcounter := firstreggpr to RS_R31 do
              begin
                offset:= offset - 4;
                reference_reset_base(href, NR_STACK_POINTER_REG, offset, 4);
                list.concat(taicpu.op_reg_ref(A_LWZ, newreg(R_INTREGISTER,regcounter,R_SUBWHOLE), href));
              end;
          end;

      { now comes the AltiVec context restore, not yet implemented !!! }
    end;


    procedure tcgppc.g_stackframe_entry_mac(list : TAsmList;localsize : longint);
 (* NOT IN USE *)
 { generates the entry code of a procedure/function. Note: localsize is the }
 { sum of the size necessary for local variables and the maximum possible   }
 { combined size of ALL the parameters of a procedure called by the current }
 { one                                                                      }
     const
         macosLinkageAreaSize = 24;
     var
         href : treference;
         registerSaveAreaSize : longint;
      begin
        if (localsize mod 8) <> 0 then
          internalerror(58991);

        { CR and LR only have to be saved in case they are modified by the current }
        { procedure, but currently this isn't checked, so save them always         }
        { following is the entry code as described in "Altivec Programming }
        { Interface Manual", bar the saving of AltiVec registers           }
        a_reg_alloc(list,NR_STACK_POINTER_REG);
        a_reg_alloc(list,NR_R0);

        { save return address in callers frame}
        list.concat(taicpu.op_reg_reg(A_MFSPR,NR_R0,NR_LR));
        { ...
in caller's frame }
        reference_reset_base(href,NR_STACK_POINTER_REG,8, 8);
        list.concat(taicpu.op_reg_ref(A_STW,NR_R0,href));
        a_reg_dealloc(list,NR_R0);

        { save non-volatile registers in callers frame}
        registerSaveAreaSize:= save_regs(list);

        { save the CR if necessary in callers frame ( !!! always done currently ) }
        { NOTE(review): CR is read with A_MFSPR here, whereas g_flags2reg }
        { uses A_MFCR for the same register - confirm before reviving     }
        { this (unused) routine                                           }
        a_reg_alloc(list,NR_R0);
        list.concat(taicpu.op_reg_reg(A_MFSPR,NR_R0,NR_CR));
        reference_reset_base(href,NR_STACK_POINTER_REG,LA_CR_AIX,4);
        list.concat(taicpu.op_reg_ref(A_STW,NR_R0,href));
        a_reg_dealloc(list,NR_R0);

        (*
        { save pointer to incoming arguments }
        list.concat(taicpu.op_reg_reg_const(A_ORI,R_31,STACK_POINTER_REG,0));
        *)

        (*
        a_reg_alloc(list,R_12);

        { 0 or 8 based on SP alignment }
        list.concat(taicpu.op_reg_reg_const_const_const(A_RLWINM,
          R_12,STACK_POINTER_REG,0,28,28));
        { add in stack length }
        list.concat(taicpu.op_reg_reg_const(A_SUBFIC,R_12,R_12,
          -localsize));
        { establish new alignment }
        list.concat(taicpu.op_reg_reg_reg(A_STWUX,STACK_POINTER_REG,STACK_POINTER_REG,R_12));
        a_reg_dealloc(list,R_12);
        *)

        { allocate stack frame }
        { total = locals + linkage area + register save area, rounded up }
        { to 16, plus tg.lasttemp, rounded up to 16 again                }
        localsize:= align(localsize + macosLinkageAreaSize + registerSaveAreaSize, 16);
        inc(localsize,tg.lasttemp);
        localsize:=align(localsize,16);
        { disabled: tppcprocinfo(current_procinfo).localsize:=localsize; }

        if (localsize <> 0) then
          begin
            if (localsize <= high(smallint)) then
              begin
                { displacement fits the 16 bit field: store-with-update }
                reference_reset_base(href,NR_STACK_POINTER_REG,-localsize,8);
                a_load_store(list,A_STWU,NR_STACK_POINTER_REG,href);
              end
            else
              begin
                { too large for an immediate: put -localsize in r11 and }
                { use the indexed form                                  }
                reference_reset_base(href,NR_STACK_POINTER_REG,0,8);
                href.index := NR_R11;
                a_reg_alloc(list,href.index);
                a_load_const_reg(list,OS_S32,-localsize,href.index);
                a_load_store(list,A_STWUX,NR_STACK_POINTER_REG,href);
                a_reg_dealloc(list,href.index);
              end;
          end;
      end;


    procedure tcgppc.g_return_from_proc_mac(list : TAsmList;parasize : aint);
 (* NOT IN USE *)
      { Generates the exit code matching g_stackframe_entry_mac: reloads   }
      { the stack pointer from LA_SP, restores CR, the non-volatile        }
      { registers (restore_regs) and the return address from the caller's  }
      { frame, then returns with BLR. parasize is not looked at.           }
      var
        href : treference;
      begin
        a_reg_alloc(list,NR_R0);

        { restore stack pointer }
        reference_reset_base(href,NR_STACK_POINTER_REG,LA_SP,4);
        list.concat(taicpu.op_reg_ref(A_LWZ,NR_STACK_POINTER_REG,href));
        (*
        list.concat(taicpu.op_reg_reg_const(A_ORI,NR_STACK_POINTER_REG,R_31,0));
        *)

        { restore the CR if necessary from callers frame
            ( !!! always done currently ) }
        reference_reset_base(href,NR_STACK_POINTER_REG,LA_CR_AIX,4);
        list.concat(taicpu.op_reg_ref(A_LWZ,NR_R0,href));
        list.concat(taicpu.op_reg_reg(A_MTSPR,NR_R0,NR_CR));
        a_reg_dealloc(list,NR_R0);

        (*
        { restore return address from callers frame }
        reference_reset_base(href,STACK_POINTER_REG,8);
        list.concat(taicpu.op_reg_ref(A_LWZ,R_0,href));
        *)

        { restore non-volatile registers from callers frame }
        restore_regs(list);

        (*
        { return to caller }
        list.concat(taicpu.op_reg_reg(A_MTSPR,R_0,R_LR));
        list.concat(taicpu.op_none(A_BLR));
        *)

        { restore return address from callers frame }
        { r0 was released above, so mark it as in use again for the }
        { duration of the reload                                    }
        a_reg_alloc(list,NR_R0);
        reference_reset_base(href,NR_STACK_POINTER_REG,8,8);
        list.concat(taicpu.op_reg_ref(A_LWZ,NR_R0,href));

        { return to caller }
        list.concat(taicpu.op_reg_reg(A_MTSPR,NR_R0,NR_LR));
        a_reg_dealloc(list,NR_R0);
        list.concat(taicpu.op_none(A_BLR));
      end;


{ ************* concatcopy ************ }

{ size in bytes of the largest unit g_concatcopy moves at once }
{$ifdef use8byteconcatcopy}
  const
    maxmoveunit = 8;
{$else use8byteconcatcopy}
  const
    maxmoveunit = 4;
{$endif use8byteconcatcopy}

    procedure tcgppc.g_concatcopy(list : TAsmList;const source,dest : treference;len : aint);

      var
        countreg:
TRegister;        src, dst: TReference;        lab: tasmlabel;        count, count2: aint;        size: tcgsize;        copyreg: tregister;      begin{$ifdef extdebug}        if len > high(longint) then          internalerror(2002072704);{$endif extdebug}        if (references_equal(source,dest)) then          exit;        { make sure short loads are handled as optimally as possible }        if (len <= maxmoveunit) and           (byte(len) in [1,2,4,8]) then          begin            if len < 8 then              begin                size := int_cgsize(len);                a_load_ref_ref(list,size,size,source,dest);              end            else              begin                copyreg := getfpuregister(list,OS_F64);                a_loadfpu_ref_reg(list,OS_F64,OS_F64,source,copyreg);                a_loadfpu_reg_ref(list,OS_F64,OS_F64,copyreg,dest);              end;            exit;          end;        count := len div maxmoveunit;        reference_reset(src,source.alignment);        reference_reset(dst,dest.alignment);        { load the address of source into src.base }        if (count > 4) or           not issimpleref(source) or           ((source.index <> NR_NO) and            ((source.offset + longint(len)) > high(smallint))) then          begin            src.base := rg[R_INTREGISTER].getregister(list,R_SUBWHOLE);            a_loadaddr_ref_reg(list,source,src.base);          end        else          begin            src := source;          end;        { load the address of dest into dst.base }        if (count > 4) or           not issimpleref(dest) or           ((dest.index <> NR_NO) and            ((dest.offset + longint(len)) > high(smallint))) then          begin            dst.base := rg[R_INTREGISTER].getregister(list,R_SUBWHOLE);            a_loadaddr_ref_reg(list,dest,dst.base);          end        else          begin            dst := dest;          end;{$ifdef use8byteconcatcopy}        if count > 4 then          { generate a loop }          
begin            { the offsets are zero after the a_loadaddress_ref_reg and just }            { have to be set to 8. I put an Inc there so debugging may be   }            { easier (should offset be different from zero here, it will be }            { easy to notice in the generated assembler                     }            inc(dst.offset,8);            inc(src.offset,8);            list.concat(taicpu.op_reg_reg_const(A_SUBI,src.base,src.base,8));            list.concat(taicpu.op_reg_reg_const(A_SUBI,dst.base,dst.base,8));            countreg := rg[R_INTREGISTER].getregister(list,R_SUBWHOLE);            a_load_const_reg(list,OS_32,count,countreg);            copyreg := getfpuregister(list,OS_F64);            a_reg_sync(list,copyreg);            current_asmdata.getjumplabel(lab);            a_label(list, lab);            list.concat(taicpu.op_reg_reg_const(A_SUBIC_,countreg,countreg,1));            list.concat(taicpu.op_reg_ref(A_LFDU,copyreg,src));            list.concat(taicpu.op_reg_ref(A_STFDU,copyreg,dst));            a_jmp(list,A_BC,C_NE,0,lab);            a_reg_sync(list,copyreg);            len := len mod 8;          end;        count := len div 8;        if count > 0 then          { unrolled loop }          begin            copyreg := getfpuregister(list,OS_F64);            for count2 := 1 to count do              begin                a_loadfpu_ref_reg(list,OS_F64,OS_F64,src,copyreg);                a_loadfpu_reg_ref(list,OS_F64,OS_F64,copyreg,dst);                inc(src.offset,8);                inc(dst.offset,8);              end;            len := len mod 8;          end;        if (len and 4) <> 0 then          begin            a_reg_alloc(list,NR_R0);            a_load_ref_reg(list,OS_32,OS_32,src,NR_R0);            a_load_reg_ref(list,OS_32,OS_32,NR_R0,dst);            inc(src.offset,4);            inc(dst.offset,4);            a_reg_dealloc(list,NR_R0);          end;{$else use8byteconcatcopy}        if count > 4 then          { generate a loop }      
    begin            { the offsets are zero after the a_loadaddress_ref_reg and just }            { have to be set to 4. I put an Inc there so debugging may be   }            { easier (should offset be different from zero here, it will be }            { easy to notice in the generated assembler                     }            inc(dst.offset,4);            inc(src.offset,4);            list.concat(taicpu.op_reg_reg_const(A_SUBI,src.base,src.base,4));            list.concat(taicpu.op_reg_reg_const(A_SUBI,dst.base,dst.base,4));            countreg := rg[R_INTREGISTER].getregister(list,R_SUBWHOLE);            a_load_const_reg(list,OS_32,count,countreg);            { explicitely allocate R_0 since it can be used safely here }            { (for holding date that's being copied)                    }            a_reg_alloc(list,NR_R0);            current_asmdata.getjumplabel(lab);            a_label(list, lab);            list.concat(taicpu.op_reg_reg_const(A_SUBIC_,countreg,countreg,1));            list.concat(taicpu.op_reg_ref(A_LWZU,NR_R0,src));            list.concat(taicpu.op_reg_ref(A_STWU,NR_R0,dst));            a_jmp(list,A_BC,C_NE,0,lab);            a_reg_dealloc(list,NR_R0);            len := len mod 4;          end;        count := len div 4;        if count > 0 then          { unrolled loop }          begin            a_reg_alloc(list,NR_R0);            for count2 := 1 to count do              begin                a_load_ref_reg(list,OS_32,OS_32,src,NR_R0);                a_load_reg_ref(list,OS_32,OS_32,NR_R0,dst);                inc(src.offset,4);                inc(dst.offset,4);              end;            a_reg_dealloc(list,NR_R0);            len := len mod 4;          end;{$endif use8byteconcatcopy}       { copy the leftovers }       if (len and 2) <> 0 then         begin           a_reg_alloc(list,NR_R0);           a_load_ref_reg(list,OS_16,OS_16,src,NR_R0);           a_load_reg_ref(list,OS_16,OS_16,NR_R0,dst);           inc(src.offset,2);           
inc(dst.offset,2);           a_reg_dealloc(list,NR_R0);         end;       if (len and 1) <> 0 then         begin           a_reg_alloc(list,NR_R0);           a_load_ref_reg(list,OS_8,OS_8,src,NR_R0);           a_load_reg_ref(list,OS_8,OS_8,NR_R0,dst);           a_reg_dealloc(list,NR_R0);         end;      end;{***************** This is private property, keep out! :) *****************}    function tcgppc.issimpleref(const ref: treference): boolean;      begin        if (ref.base = NR_NO) and           (ref.index <> NR_NO) then          internalerror(200208101);        result :=          not(assigned(ref.symbol)) and          (((ref.index = NR_NO) and            (ref.offset >= low(smallint)) and            (ref.offset <= high(smallint))) or           ((ref.index <> NR_NO) and            (ref.offset = 0)));      end;    { find out whether a is of the form 11..00..11b or 00..11...00. If }    { that's the case, we can use rlwinm to do an AND operation        }    function tcgppc.get_rlwi_const(a: aint; var l1, l2: longint): boolean;      var        temp : longint;        testbit : aint;        compare: boolean;      begin        get_rlwi_const := false;        if (a = 0) or (a = -1) then          exit;        { start with the lowest bit }        testbit := 1;        { check its value }        compare := boolean(a and testbit);        { find out how long the run of bits with this value is            }        { (it's impossible that all bits are 1 or 0, because in that case }        { this function wouldn't have been called)                        }        l1 := 31;        while (((a and testbit) <> 0) = compare) do          begin            testbit := testbit shl 1;            dec(l1);          end;        { check the length of the run of bits that comes next }        compare := not compare;        l2 := l1;        while (((a and testbit) <> 0) = compare) and               (l2 >= 0) do          begin            testbit := testbit shl 1;            dec(l2);          end; 
       { and finally the check whether the rest of the bits all have the }        { same value                                                      }        compare := not compare;        temp := l2;        if temp >= 0 then          if (a shr (31-temp)) <> ((-ord(compare)) shr (31-temp)) then            exit;        { we have done "not(not(compare))", so compare is back to its   }        { initial value. If the lowest bit was 0, a is of the form      }        { 00..11..00 and we need "rlwinm reg,reg,0,l2+1,l1", (+1        }        { because l2 now contains the position of the last zero of the  }        { first run instead of that of the first 1) so switch l1 and l2 }        { in that case (we will generate "rlwinm reg,reg,0,l1,l2")      }        if not compare then          begin            temp := l1;            l1 := l2+1;            l2 := temp;          end        else          { otherwise, l1 currently contains the position of the last   }          { zero instead of that of the first 1 of the second run -> +1 }          inc(l1);        { the following is the same as "if l1 = -1 then l1 := 31;" }        l1 := l1 and 31;        l2 := l2 and 31;        get_rlwi_const := true;      end;    procedure tcg64fppc.a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);      begin        a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);      end;    procedure tcg64fppc.a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);      begin        a_op64_const_reg_reg(list,op,size,value,reg,reg);      end;    procedure tcg64fppc.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);      begin        case op of          OP_AND,OP_OR,OP_XOR:            begin              cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);              cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);            end;          OP_ADD:  
          begin              list.concat(taicpu.op_reg_reg_reg(A_ADDC,regdst.reglo,regsrc1.reglo,regsrc2.reglo));              list.concat(taicpu.op_reg_reg_reg(A_ADDE,regdst.reghi,regsrc1.reghi,regsrc2.reghi));            end;          OP_SUB:            begin              list.concat(taicpu.op_reg_reg_reg(A_SUBC,regdst.reglo,regsrc2.reglo,regsrc1.reglo));              list.concat(taicpu.op_reg_reg_reg(A_SUBFE,regdst.reghi,regsrc1.reghi,regsrc2.reghi));            end;          else            internalerror(2002072801);        end;      end;    procedure tcg64fppc.a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);      const        ops: array[boolean,1..3] of tasmop = ((A_ADDIC,A_ADDC,A_ADDZE),                                              (A_SUBIC,A_SUBC,A_ADDME));      var        tmpreg: tregister;        tmpreg64: tregister64;        issub: boolean;      begin        case op of          OP_AND,OP_OR,OP_XOR:            begin              cg.a_op_const_reg_reg(list,op,OS_32,aint(value),regsrc.reglo,regdst.reglo);              cg.a_op_const_reg_reg(list,op,OS_32,aint(value shr 32),regsrc.reghi,                regdst.reghi);            end;          OP_ADD, OP_SUB:            begin              if (value < 0) and                 (value <> low(value)) then                begin                  if op = OP_ADD then                    op := OP_SUB                  else                    op := OP_ADD;                  value := -value;                end;              if (longint(value) <> 0) then                begin                  issub := op = OP_SUB;                  if (value > 0) and                     (value-ord(issub) <= 32767) then                    begin                      list.concat(taicpu.op_reg_reg_const(ops[issub,1],                        regdst.reglo,regsrc.reglo,longint(value)));                      list.concat(taicpu.op_reg_reg(ops[issub,3],                        regdst.reghi,regsrc.reghi));  
                  end                  else if ((value shr 32) = 0) then                    begin                      tmpreg := tcgppc(cg).rg[R_INTREGISTER].getregister(list,R_SUBWHOLE);                      cg.a_load_const_reg(list,OS_32,aint(value),tmpreg);                      list.concat(taicpu.op_reg_reg_reg(ops[issub,2],                        regdst.reglo,regsrc.reglo,tmpreg));                      list.concat(taicpu.op_reg_reg(ops[issub,3],                        regdst.reghi,regsrc.reghi));                    end                  else                    begin                      tmpreg64.reglo := tcgppc(cg).rg[R_INTREGISTER].getregister(list,R_SUBWHOLE);                      tmpreg64.reghi := tcgppc(cg).rg[R_INTREGISTER].getregister(list,R_SUBWHOLE);                      a_load64_const_reg(list,value,tmpreg64);                      a_op64_reg_reg_reg(list,op,size,tmpreg64,regsrc,regdst);                    end                end              else                begin                  cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc.reglo,regdst.reglo);                  cg.a_op_const_reg_reg(list,op,OS_32,aint(value shr 32),regsrc.reghi,                    regdst.reghi);                end;            end;          else            internalerror(2002072802);        end;      end;begin  cg := tcgppc.create;  cg64 :=tcg64fppc.create;end.
 |