| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892 | {    Copyright (c) 1998-2004 by Jonas Maebe    This unit calls the optimization procedures to optimize the assembler    code for sparc    This program is free software; you can redistribute it and/or modify    it under the terms of the GNU General Public License as published by    the Free Software Foundation; either version 2 of the License, or    (at your option) any later version.    This program is distributed in the hope that it will be useful,    but WITHOUT ANY WARRANTY; without even the implied warranty of    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the    GNU General Public License for more details.    You should have received a copy of the GNU General Public License    along with this program; if not, write to the Free Software    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. ****************************************************************************}unit aoptcpu;{$i fpcdefs.inc}{ $define DEBUG_AOPTCPU}  Interface    uses      cgbase, cpubase, aoptobj, aoptcpub, aopt, aasmtai, aasmcpu;    Type      TAsmOpSet = set of TAsmOp;      TCpuAsmOptimizer = class(TAsmOptimizer)        function RegModifiedByInstruction(Reg: TRegister; p1: tai): boolean; override;        function GetNextInstructionUsingReg(Current: tai;          var Next: tai; reg: TRegister): Boolean;        function TryRemoveMov(var p: tai; opcode: TAsmOp): boolean;        function TryRemoveMovToRefIndex(var p: tai; next: taicpu): boolean;        function TryRemoveMovBeforeStore(var p: tai; next: taicpu; const storeops: TAsmOpSet): boolean;        function PeepHoleOptPass1Cpu(var p: tai): boolean; override;        procedure PeepHoleOptPass2; override;        function RegLoadedWithNewValue(reg : tregister; hp : tai) : boolean; override;        function InstructionLoadsFromReg(const reg : TRegister; const hp : tai) : boolean; override;        { outputs a debug message into the assembler file }        procedure DebugMsg(const s: string; p: tai);      End;  Implementation     uses       cutils,globtype,globals,aasmbase,cpuinfo,verbose;  function MatchInstruction(const instr: tai; const op: TAsmOp): boolean;    begin      result :=        (instr.typ = ait_instruction) and        (taicpu(instr).opcode = op);    end;  function MatchOperand(const oper: TOper; reg: TRegister): boolean;    begin      result:=(oper.typ=top_reg) and (oper.reg=reg);    end;  function IsSameReg(this,next: taicpu): boolean;    begin      result:=(next.oper[0]^.typ=top_reg) and        (next.oper[1]^.typ=top_reg) and        (next.oper[0]^.reg=next.oper[1]^.reg) and        (next.oper[0]^.reg=this.oper[0]^.reg);    end;  function CanBeCMOV(p: tai; condreg: tregister): boolean;    begin      result:=assigned(p) and (p.typ=ait_instruction) and        ((taicpu(p).opcode in [A_MOV_D,A_MOV_S]) or        (          { register with condition must not be overwritten }          (taicpu(p).opcode=A_MOVE) and          (taicpu(p).oper[0]^.reg<>condreg)        ));    end;  procedure ChangeToCMOV(p: taicpu; cond: tasmcond; reg: tregister);    begin      case cond of        C_COP1TRUE:          case p.opcode of            A_MOV_D: p.opcode:=A_MOVT_D;            A_MOV_S: p.opcode:=A_MOVT_S;            A_MOVE:  p.opcode:=A_MOVT;          else            InternalError(2014061701);          end;        C_COP1FALSE:          case p.opcode of            A_MOV_D: p.opcode:=A_MOVF_D;            A_MOV_S: p.opcode:=A_MOVF_S;            A_MOVE:  p.opcode:=A_MOVF;          else            InternalError(2014061702);          end;        C_EQ:          case p.opcode of            A_MOV_D: p.opcode:=A_MOVZ_D;            A_MOV_S: p.opcode:=A_MOVZ_S;            A_MOVE:  p.opcode:=A_MOVZ;          else            InternalError(2014061703);          end;        C_NE:          case p.opcode of            A_MOV_D: p.opcode:=A_MOVN_D;            A_MOV_S: p.opcode:=A_MOVN_S;            A_MOVE:  p.opcode:=A_MOVN;          else            InternalError(2014061704);          end;      else        InternalError(2014061705);      end;      p.ops:=3;      p.loadreg(2,reg);    end;{$ifdef DEBUG_AOPTCPU}  procedure TCpuAsmOptimizer.DebugMsg(const s: string;p : tai);    begin      asml.insertbefore(tai_comment.Create(strpnew(s)), p);    end;{$else DEBUG_AOPTCPU}  procedure TCpuAsmOptimizer.DebugMsg(const s: string;p : tai);inline;    begin    end;{$endif DEBUG_AOPTCPU} function TCpuAsmOptimizer.InstructionLoadsFromReg(const reg: TRegister; const hp: tai): boolean;    var      p: taicpu;      i: longint;    begin      result:=false;      if not (assigned(hp) and (hp.typ=ait_instruction)) then        exit;      p:=taicpu(hp);      i:=0;      while(i<p.ops) do        begin          case p.oper[I]^.typ of            top_reg:              result:=(p.oper[I]^.reg=reg) and (p.spilling_get_operation_type(I)<>operand_write);            top_ref:              result:=                (p.oper[I]^.ref^.base=reg) or                (p.oper[I]^.ref^.index=reg);            else              ;          end;          if result then exit; {Bailout if we found something}          Inc(I);        end;    end;  function TCpuAsmOptimizer.RegLoadedWithNewValue(reg: tregister; hp: tai): boolean;    var      p: taicpu;    begin      p:=taicpu(hp);      result:=false;      if not ((assigned(hp)) and (hp.typ=ait_instruction)) then        exit;      case p.opcode of        { These instructions do not write into a register at all }        A_NOP,        A_C_EQ_D,A_C_EQ_S,A_C_LE_D,A_C_LE_S,A_C_LT_D,A_C_LT_S,        A_BA,A_BC,        A_SB,A_SH,A_SW,A_SWL,A_SWR,A_SWC1,A_SDC1:          exit;        else        ;      end;      result:=(p.ops>0) and (p.oper[0]^.typ=top_reg) and        (p.oper[0]^.reg=reg);    end;  function TCpuAsmOptimizer.RegModifiedByInstruction(Reg: TRegister; p1: tai): boolean;    var      i : Longint;    begin      result:=false;      for i:=0 to taicpu(p1).ops-1 do        if (taicpu(p1).oper[i]^.typ=top_reg) and (taicpu(p1).oper[i]^.reg=Reg) and (taicpu(p1).spilling_get_operation_type(i) in [operand_write,operand_readwrite]) then          begin            result:=true;            exit;          end;    end;  function TCpuAsmOptimizer.GetNextInstructionUsingReg(Current: tai;    var Next: tai; reg: TRegister): Boolean;    begin      Next:=Current;      repeat        Result:=GetNextInstruction(Next,Next);      until {not(cs_opt_level3 in current_settings.optimizerswitches) or} not(Result) or (Next.typ<>ait_instruction) or (RegInInstruction(reg,Next)) or        (is_calljmp(taicpu(Next).opcode));    end;  function TCpuAsmOptimizer.TryRemoveMov(var p: tai; opcode: TAsmOp): boolean;    var      next,hp1: tai;      alloc,dealloc: tai_regalloc;    begin      { Fold          op      $reg1,...          opcode  $reg2,$reg1          dealloc $reg1        into          op   $reg2,...        opcode may be A_MOVE, A_MOV_s, A_MOV_d, etc.      }      result:=false;      if (taicpu(p).ops>0) and         GetNextInstructionUsingReg(p,next,taicpu(p).oper[0]^.reg) and         MatchInstruction(next,opcode) and         MatchOperand(taicpu(next).oper[1]^,taicpu(p).oper[0]^.reg) and         { the destination register of mov cannot be used between p and next }         (not RegUsedBetween(taicpu(next).oper[0]^.reg,p,next)) then        begin          dealloc:=FindRegDealloc(taicpu(p).oper[0]^.reg,tai(next.Next));          if assigned(dealloc) then            begin              { taicpu(p).oper[0]^.reg is not used anymore, try to find its allocation                and remove it if possible }              GetLastInstruction(p,hp1);              asml.Remove(dealloc);              alloc:=FindRegAlloc(taicpu(p).oper[0]^.reg,tai(hp1.Next));              if assigned(alloc) then                begin                  asml.Remove(alloc);                  alloc.free;                  dealloc.free;                end              else                asml.InsertAfter(dealloc,p);              { try to move the allocation of the target register }              GetLastInstruction(next,hp1);              alloc:=FindRegAlloc(taicpu(next).oper[0]^.reg,tai(hp1.Next));              if assigned(alloc) then                begin                  asml.Remove(alloc);                  asml.InsertBefore(alloc,p);                  { adjust used regs }                  IncludeRegInUsedRegs(taicpu(next).oper[0]^.reg,UsedRegs);                end;              { finally get rid of the mov }              taicpu(p).loadreg(0,taicpu(next).oper[0]^.reg);              DebugMsg('Peephole: Move removed 1',next);              asml.remove(next);              next.free;              result:=true;            end          else       // no dealloc found            begin              { try to optimize the typical call sequence                lw  $reg, (whatever)                <alloc volatile registers (including $reg!!)>                move $t9,$reg                jalr $t9                if $reg is nonvolatile, its value may be used after call                 and we cannot safely replace it with $t9 }              if (opcode=A_MOVE) and                 (taicpu(next).oper[0]^.reg=NR_R25) and                 GetNextInstruction(next,hp1) and                 MatchInstruction(hp1,A_JALR) and                 MatchOperand(taicpu(hp1).oper[0]^,NR_R25) and                 assigned(FindRegAlloc(taicpu(p).oper[0]^.reg,tai(p.next))) then                begin                  taicpu(p).loadreg(0,taicpu(next).oper[0]^.reg);                  DebugMsg('Peephole: Move removed 2',next);                  asml.remove(next);                  next.free;                  result:=true;                end;            end;        end;    end;  function TCpuAsmOptimizer.TryRemoveMovBeforeStore(var p: tai; next: taicpu; const storeops: TAsmOpSet): boolean;    begin      result:=(next.opcode in storeops) and        MatchOperand(next.oper[0]^,taicpu(p).oper[0]^.reg) and        { Ry cannot be modified between move and store }        (not RegModifiedBetween(taicpu(p).oper[1]^.reg,p,next)) and        Assigned(FindRegDealloc(taicpu(p).oper[0]^.reg,tai(next.next)));      if result then        begin          next.loadreg(0,taicpu(p).oper[1]^.reg);          DebugMsg('Peephole: Move removed 3',p);          asml.remove(p);          p.free;          p:=next;        end;    end;  function TCpuAsmOptimizer.TryRemoveMovToRefIndex(var p: tai; next: taicpu): boolean;    begin      result:=(next.ops>1) and        (next.oper[1]^.typ=top_ref) and        (next.oper[1]^.ref^.refaddr<>addr_full) and        (next.oper[1]^.ref^.base=taicpu(p).oper[0]^.reg) and        (not RegModifiedBetween(taicpu(p).oper[1]^.reg,p,next)) and        Assigned(FindRegDealloc(taicpu(p).oper[0]^.reg,tai(next.next)));      if result then        begin          next.oper[1]^.ref^.base:=taicpu(p).oper[1]^.reg;          DebugMsg('Peephole: Move removed 4',p);          asml.remove(p);          p.free;          p:=next;        end;    end;  function TCpuAsmOptimizer.PeepHoleOptPass1Cpu(var p: tai): boolean;    var      next,next2: tai;    begin      result:=false;      case p.typ of        ait_instruction:          begin            case taicpu(p).opcode of              A_BC:                begin                  { BEQ/BNE with same register are bogus, but can be generated for code like                   "if lo(qwordvar)=cardinal(qwordvar) ...",                    optimizations below can also yield them, e.g. if one register was initially R0. }                  if (taicpu(p).condition in [C_EQ,C_NE]) and                    (taicpu(p).oper[0]^.reg=taicpu(p).oper[1]^.reg) then                    begin                      if (taicpu(p).condition=C_NE) then                        begin                          if (taicpu(p).oper[2]^.typ = top_ref) and                            (taicpu(p).oper[2]^.ref^.symbol is TAsmLabel) then                            TAsmLabel(taicpu(p).oper[2]^.ref^.symbol).decrefs;                          RemoveDelaySlot(p);                          GetNextInstruction(p,next);                        end                      else                        begin                          next:=taicpu.op_sym(A_BA,taicpu(p).oper[2]^.ref^.symbol);                          taicpu(next).fileinfo:=taicpu(p).fileinfo;                          asml.insertbefore(next,p);                        end;                      asml.remove(p);                      p.Free;                      p:=next;                      result:=true;                    end;                end;              A_SEH:                begin                  if GetNextInstructionUsingReg(p,next,taicpu(p).oper[0]^.reg) and                    MatchInstruction(next,A_SH) and                    MatchOperand(taicpu(next).oper[0]^,taicpu(p).oper[0]^.reg) and                    (not RegUsedBetween(taicpu(p).oper[1]^.reg,p,next)) and                    Assigned(FindRegDealloc(taicpu(p).oper[0]^.reg,tai(next.next))) then                    begin                      taicpu(next).loadreg(0,taicpu(p).oper[1]^.reg);                      asml.remove(p);                      p.free;                      p:=next;                      result:=true;                    end                  else                    result:=TryRemoveMov(p,A_MOVE);                end;              A_SEB:                { TODO: can be handled similar to A_SEH, but it's almost never encountered }                result:=TryRemoveMov(p,A_MOVE);              A_SLL:                begin                  { if this is a sign extension... }                  if (taicpu(p).oper[2]^.typ=top_const) and                    GetNextInstruction(p,next) and                    MatchInstruction(next,A_SRA) and                    IsSameReg(taicpu(p),taicpu(next)) and                    (taicpu(next).oper[2]^.typ=top_const) and                    (taicpu(next).oper[2]^.val=taicpu(p).oper[2]^.val) and                    (taicpu(next).oper[2]^.val=16) and                    { ...followed by 16-bit store (possibly with PIC simplification, etc. in between) }                    GetNextInstructionUsingReg(next,next2,taicpu(p).oper[0]^.reg) and                    MatchInstruction(next2,A_SH) and                    (taicpu(next2).oper[0]^.typ=top_reg) and                    (taicpu(next2).oper[0]^.reg=taicpu(p).oper[0]^.reg) and                    { the initial register may not be reused }                    (not RegUsedBetween(taicpu(p).oper[1]^.reg,next,next2)) then                    begin                      if Assigned(FindRegDealloc(taicpu(p).oper[0]^.reg,tai(next2.next))) then                        begin                          taicpu(next2).loadreg(0,taicpu(p).oper[1]^.reg);                          asml.remove(p);                          asml.remove(next);                          p.free;                          next.free;                          p:=next2;                          result:=true;                        end;                    end                  else                    result:=TryRemoveMov(p,A_MOVE);                end;              A_SRL:                begin                  { TODO: also kill sign-extensions that follow, both SLL+SRA and SEB/SEH versions }                  { Remove 'andi' in sequences                      srl   Rx,Ry,16                      andi  Rx,Rx,65535                      srl   Rx,Ry,24                      andi  Rx,Rx,255                    since 'srl' clears all relevant upper bits }                  if (taicpu(p).oper[2]^.typ=top_const) and                    GetNextInstruction(p,next) and                    MatchInstruction(next,A_ANDI) and                    IsSameReg(taicpu(p),taicpu(next)) and                    (taicpu(next).oper[2]^.typ=top_const) and                    ((                      (taicpu(p).oper[2]^.val>=16) and                      (taicpu(next).oper[2]^.val=65535)                    ) or (                      (taicpu(p).oper[2]^.val>=24) and                      (taicpu(next).oper[2]^.val=255)                    )) then                    begin                      asml.remove(next);                      next.free;                      result:=true;                    end                  else                    result:=TryRemoveMov(p,A_MOVE);                end;              A_ANDI:                begin                  { Remove sign extension after 'andi' if bit 7/15 of const operand is clear }                  if (taicpu(p).oper[2]^.typ=top_const) and                    GetNextInstruction(p,next) and                    MatchInstruction(next,A_SLL) and                    GetNextInstruction(next,next2) and                    MatchInstruction(next2,A_SRA) and                    IsSameReg(taicpu(p),taicpu(next)) and                    IsSameReg(taicpu(p),taicpu(next2)) and                    (taicpu(next).oper[2]^.typ=top_const) and                    (taicpu(next2).oper[2]^.typ=top_const) and                    (taicpu(next).oper[2]^.val=taicpu(next2).oper[2]^.val) and                    ((                      (taicpu(p).oper[2]^.val<=$7fff) and                      (taicpu(next).oper[2]^.val=16)                    ) or (                      (taicpu(p).oper[2]^.val<=$7f) and                      (taicpu(next).oper[2]^.val=24)                    )) then                    begin                      asml.remove(next);                      asml.remove(next2);                      next.free;                      next2.free;                      result:=true;                    end                  { Remove zero extension if register is used only for byte/word memory store }                  else if (taicpu(p).oper[2]^.typ=top_const) and                    GetNextInstruction(p,next) and                    ((taicpu(p).oper[2]^.val=255) and MatchInstruction(next,A_SB)) or                    ((taicpu(p).oper[2]^.val=65535) and MatchInstruction(next,A_SH)) and                    (taicpu(next).oper[0]^.typ=top_reg) and                    (taicpu(next).oper[0]^.reg=taicpu(p).oper[0]^.reg) and                    assigned(FindRegDealloc(taicpu(p).oper[0]^.reg,tai(next.next))) then                    begin                      taicpu(next).loadreg(0,taicpu(p).oper[1]^.reg);                      asml.remove(p);                      p.free;                      p:=next;                      result:=true;                    end                  else                    result:=TryRemoveMov(p,A_MOVE);                end;              A_MOV_S:                begin                  if GetNextInstructionUsingReg(p,next,taicpu(p).oper[0]^.reg) and                     (next.typ=ait_instruction) then                    begin                      if TryRemoveMovBeforeStore(p,taicpu(next),[A_SWC1]) then                        result:=true;                    end;                end;              A_MOV_D:                begin                  if GetNextInstructionUsingReg(p,next,taicpu(p).oper[0]^.reg) and                     (next.typ=ait_instruction) then                    begin                      if TryRemoveMovBeforeStore(p,taicpu(next),[A_SDC1]) then                        result:=true;                    end;                end;              A_MOVE:                begin                  if GetNextInstructionUsingReg(p,next,taicpu(p).oper[0]^.reg) and                    (next.typ=ait_instruction) and                    (not RegModifiedBetween(taicpu(p).oper[1]^.reg,p,next)) then                    begin                      { MOVE  Rx,Ry; store Rx,(ref); dealloc Rx   ==> store Ry,(ref) }                      if TryRemoveMovBeforeStore(p,taicpu(next),[A_SB,A_SH,A_SW]) then                        result:=true                      else if TryRemoveMovToRefIndex(p,taicpu(next)) then                        result:=true                      { MOVE  Rx,Ry; opcode  Rx,Rx,any              ==> opcode Rx,Ry,any                        MOVE  Rx,Ry; opcode  Rx,Rz,Rx               ==> opcode Rx,Rz,Ry   }                      else if (taicpu(next).opcode in [A_ADD,A_ADDU,A_ADDI,A_ADDIU,A_SUB,A_SUBU,A_AND,A_ANDI,A_SLLV,A_SRLV,A_SRAV]) and                         MatchOperand(taicpu(next).oper[0]^,taicpu(p).oper[0]^.reg) then                        begin                          if MatchOperand(taicpu(next).oper[1]^,taicpu(p).oper[0]^.reg) then                            begin                              taicpu(next).loadreg(1,taicpu(p).oper[1]^.reg);                              asml.remove(p);                              p.free;                              p:=next;                              result:=true;                            end                          { TODO: if Ry=NR_R0, this effectively changes instruction into MOVE,                            providing further optimization possibilities }                          else if MatchOperand(taicpu(next).oper[2]^,taicpu(p).oper[0]^.reg) then                            begin                              taicpu(next).loadreg(2,taicpu(p).oper[1]^.reg);                              asml.remove(p);                              p.free;                              p:=next;                              result:=true;                            end;                        end                      { MOVE  Rx,Ry; opcode Rz,Rx,any; dealloc Rx  ==> opcode Rz,Ry,any }                      else if (taicpu(next).opcode in [A_ADD,A_ADDU,A_ADDI,A_ADDIU,A_SUB,A_SUBU,A_SLT,A_SLTU,A_DIV,A_DIVU,                                                       A_SLL,A_SRL,A_SRA,A_SLLV,A_SRLV,A_SRAV,A_AND,A_ANDI,A_OR,A_ORI,A_XOR,A_XORI]) and                         Assigned(FindRegDealloc(taicpu(p).oper[0]^.reg,tai(next.next))) then                        begin                          if MatchOperand(taicpu(next).oper[1]^,taicpu(p).oper[0]^.reg) then                            begin                              taicpu(next).loadreg(1,taicpu(p).oper[1]^.reg);                              asml.remove(p);                              p.free;                              p:=next;                              result:=true;                            end                          else if MatchOperand(taicpu(next).oper[2]^,taicpu(p).oper[0]^.reg) then                            begin                              taicpu(next).loadreg(2,taicpu(p).oper[1]^.reg);                              asml.remove(p);                              p.free;                              p:=next;                              result:=true;                            end;                        end                      { MULT[U] and cond.branches must be handled separately due to different operand numbers }                      else if (taicpu(next).opcode in [A_MULT,A_MULTU,A_BC]) and                         Assigned(FindRegDealloc(taicpu(p).oper[0]^.reg,tai(next.next))) then                        begin                          if MatchOperand(taicpu(next).oper[0]^,taicpu(p).oper[0]^.reg) then                            begin                              taicpu(next).loadreg(0,taicpu(p).oper[1]^.reg);                              if MatchOperand(taicpu(next).oper[1]^,taicpu(p).oper[0]^.reg) then                                taicpu(next).loadreg(1,taicpu(p).oper[1]^.reg);                              asml.remove(p);                              p.free;                              p:=next;                              result:=true;                            end                          else if MatchOperand(taicpu(next).oper[1]^,taicpu(p).oper[0]^.reg) then                            begin                              taicpu(next).loadreg(1,taicpu(p).oper[1]^.reg);                              if MatchOperand(taicpu(next).oper[0]^,taicpu(p).oper[0]^.reg) then                                taicpu(next).loadreg(0,taicpu(p).oper[1]^.reg);                              asml.remove(p);                              p.free;                              p:=next;                              result:=true;                            end;                        end                      else if TryRemoveMov(p,A_MOVE) then                        begin                          { Ended up with move between same register? Suicide then. }                          if (taicpu(p).oper[0]^.reg=taicpu(p).oper[1]^.reg) then                            begin                              GetNextInstruction(p,next);                              asml.remove(p);                              p.free;                              p:=next;                              result:=true;                            end;                        end;                    end;                end;              A_ADDIU:                begin                  { ADDIU  Rx,Ry,const;    load/store  Rz,(Rx); dealloc Rx  ==> load/store Rz,const(Ry)                    ADDIU  Rx,Ry,%lo(sym); load/store  Rz,(Rx); dealloc Rx  ==> load/store Rz,%lo(sym)(Ry)                    ADDIU  Rx,Ry,const;    load Rx,(Rx)                     ==> load Rx,const(Ry)                    ADDIU  Rx,Ry,%lo(sym); load Rx,(Rx)                     ==> load Rx,%lo(sym)(Ry)    }                  if GetNextInstructionUsingReg(p,next,taicpu(p).oper[0]^.reg) and                    (next.typ=ait_instruction) and                    (taicpu(next).opcode in [A_LB,A_LBU,A_LH,A_LHU,A_LW,A_SB,A_SH,A_SW]) and                    (taicpu(p).oper[0]^.reg=taicpu(next).oper[1]^.ref^.base) and                    (taicpu(next).oper[1]^.ref^.offset=0) and                    (taicpu(next).oper[1]^.ref^.symbol=nil) and                    (                      Assigned(FindRegDealloc(taicpu(p).oper[0]^.reg,tai(next.next))) or                      (                        (taicpu(p).oper[0]^.reg=taicpu(next).oper[0]^.reg) and                        (taicpu(next).opcode in [A_LB,A_LBU,A_LH,A_LHU,A_LW])                      )                    )  and                    (not RegModifiedBetween(taicpu(p).oper[1]^.reg,p,next)) then                    begin                      case taicpu(p).oper[2]^.typ of                        top_const:                          taicpu(next).oper[1]^.ref^.offset:=taicpu(p).oper[2]^.val;                        top_ref:                          taicpu(next).oper[1]^.ref^:=taicpu(p).oper[2]^.ref^;                      else                        InternalError(2014100401);                      end;                      taicpu(next).oper[1]^.ref^.base:=taicpu(p).oper[1]^.reg;                      asml.remove(p);                      p.free;                      p:=next;                      result:=true;                    end                  else                    result:=TryRemoveMov(p,A_MOVE);                end;              A_ADD,A_ADDU,A_OR:                begin                  if MatchOperand(taicpu(p).oper[1]^,NR_R0) then                    begin                      taicpu(p).freeop(1);                      taicpu(p).oper[1]:=taicpu(p).oper[2];                      taicpu(p).oper[2]:=nil;                      taicpu(p).ops:=2;                      taicpu(p).opercnt:=2;                      taicpu(p).opcode:=A_MOVE;                      result:=true;                    end                  else if MatchOperand(taicpu(p).oper[2]^,NR_R0) then                    begin                      taicpu(p).freeop(2);                      taicpu(p).ops:=2;                      taicpu(p).opercnt:=2;                      taicpu(p).opcode:=A_MOVE;                      result:=true;                    end                  else                    result:=TryRemoveMov(p,A_MOVE);                end;              A_LB,A_LBU,A_LH,A_LHU,A_LW,              A_ADDI,              A_SUB,A_SUBU,              A_SRA,A_SRAV,              A_SRLV,              A_SLLV,              A_MFLO,A_MFHI,              A_AND,A_XOR,A_ORI,A_XORI:                result:=TryRemoveMov(p,A_MOVE);              A_LWC1,              A_ADD_s, A_SUB_s, A_MUL_s, A_DIV_s,              A_ABS_s, A_NEG_s, A_SQRT_s,              A_CVT_s_w, A_CVT_s_l, A_CVT_s_d:                result:=TryRemoveMov(p,A_MOV_s);              A_LDC1,              A_ADD_d, A_SUB_d, A_MUL_d, A_DIV_d,              A_ABS_d, A_NEG_d, A_SQRT_d,              A_CVT_d_w, A_CVT_d_l, A_CVT_d_s:                result:=TryRemoveMov(p,A_MOV_d);              else                ;            end;          end;        else          ;      end;    end;  procedure TCpuAsmOptimizer.PeepHoleOptPass2;    var      p: tai;      l: longint;      hp1,hp2,hp3: tai;      condition: tasmcond;      condreg: tregister;    begin      { Currently, everything below is mips4+ }      if (current_settings.cputype<cpu_mips4) then        exit;      p:=BlockStart;      ClearUsedRegs;      while (p<>BlockEnd) Do        begin          UpdateUsedRegs(tai(p.next));          case p.typ of            ait_instruction:              begin                case taicpu(p).opcode of                  A_BC:                    begin                      condreg:=NR_NO;                      if (taicpu(p).condition in [C_COP1TRUE,C_COP1FALSE]) then                        { TODO: must be taken from "p" if/when codegen makes use of multiple %fcc }                        condreg:=NR_FCC0                      else if (taicpu(p).condition in [C_EQ,C_NE]) then                        begin                          if (taicpu(p).oper[0]^.reg=NR_R0) then                            condreg:=taicpu(p).oper[1]^.reg                          else if (taicpu(p).oper[1]^.reg=NR_R0) then                            condreg:=taicpu(p).oper[0]^.reg                        end;                      if (condreg<>NR_NO) then                        begin                          { check for                              bCC   xxx                              <several movs>                          xxx:                          }                          l:=0;                          GetNextInstruction(p, hp1);                          while CanBeCMOV(hp1,condreg) do       // CanBeCMOV returns False for nil or labels                            begin                              inc(l);                              GetNextInstruction(hp1,hp1);                            end;                          if assigned(hp1) then                            begin                              if FindLabel(tasmlabel(taicpu(p).oper[taicpu(p).ops-1]^.ref^.symbol),hp1) then                                begin                                  if (l<=4) and (l>0) then                                    begin                                      condition:=inverse_cond(taicpu(p).condition);                                      hp2:=p;                                      GetNextInstruction(p,hp1);                                      p:=hp1;                                      repeat                                        ChangeToCMOV(taicpu(hp1),condition,condreg);                                        GetNextInstruction(hp1,hp1);                                      until not CanBeCMOV(hp1,condreg);                                      { wait with removing else GetNextInstruction could                                        ignore the label if it was the only usage in the                                        jump moved away }                                      tasmlabel(taicpu(hp2).oper[taicpu(hp2).ops-1]^.ref^.symbol).decrefs;                                      RemoveDelaySlot(hp2);                                      asml.remove(hp2);                                      hp2.free;                                      continue;                                    end;                                end                              else                                begin                                  { check further for                                        bCC   xxx                                        <several movs 1>                                        b     yyy                                    xxx:                                        <several movs 2>                                    yyy:                                  }                                  { hp2 points to jmp yyy }                                  hp2:=hp1;                                  { skip hp1 to xxx }                                  GetNextInstruction(hp1, hp1);                                  if assigned(hp2) and                                    assigned(hp1) and                                    (l<=3) and                                    (hp2.typ=ait_instruction) and                                    (taicpu(hp2).opcode=A_BA) and                                    { real label and jump, no further references to the                                      label are allowed }                                    (tasmlabel(taicpu(p).oper[taicpu(p).ops-1]^.ref^.symbol).getrefs<=2) and                                    FindLabel(tasmlabel(taicpu(p).oper[taicpu(p).ops-1]^.ref^.symbol),hp1) then                                    begin                                      l:=0;                                      { skip hp1 to <several moves 2> }                                      GetNextInstruction(hp1, hp1);                                      while CanBeCMOV(hp1,condreg) do                                        begin                                          inc(l);                                          GetNextInstruction(hp1, hp1);                                        end;                                      { hp1 points to yyy: }                                      if assigned(hp1) and (l<=3) and                                        FindLabel(tasmlabel(taicpu(hp2).oper[taicpu(hp2).ops-1]^.ref^.symbol),hp1) then                                        begin                                          condition:=inverse_cond(taicpu(p).condition);                                          GetNextInstruction(p,hp1);                                          hp3:=p;                                          p:=hp1;                                          while CanBeCMOV(hp1,condreg) do                                            begin                                              ChangeToCMOV(taicpu(hp1),condition,condreg);                                              GetNextInstruction(hp1,hp1);                                            end;                                          { hp2 is still at b yyy }                                          GetNextInstruction(hp2,hp1);                                          { hp2 is now at xxx: }                                          condition:=inverse_cond(condition);                                          GetNextInstruction(hp1,hp1);                                          { hp1 is now at <several movs 2> }                                          while CanBeCMOV(hp1,condreg) do                                            begin                                              ChangeToCMOV(taicpu(hp1),condition,condreg);                                              GetNextInstruction(hp1,hp1);                                            end;                                          { remove bCC }                                          tasmlabel(taicpu(hp3).oper[taicpu(hp3).ops-1]^.ref^.symbol).decrefs;                                          RemoveDelaySlot(hp3);                                          asml.remove(hp3);                                          hp3.free;                                          { remove jmp }                                          tasmlabel(taicpu(hp2).oper[taicpu(hp2).ops-1]^.ref^.symbol).decrefs;                                          RemoveDelaySlot(hp2);                                          asml.remove(hp2);                                          hp2.free;                                          continue;                                        end;                                    end;                                end;                            end;                        end;                    end;                  else                    ;                end;              end;            else              ;          end;          UpdateUsedRegs(p);          p:=tai(p.next);        end;    end;begin  casmoptimizer:=TCpuAsmOptimizer;end.
 |