| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701 | {    Copyright (c) 1998-2004 by Jonas Maebe    This unit calls the optimization procedures to optimize the assembler    code for sparc    This program is free software; you can redistribute it and/or modify    it under the terms of the GNU General Public License as published by    the Free Software Foundation; either version 2 of the License, or    (at your option) any later version.    This program is distributed in the hope that it will be useful,    but WITHOUT ANY WARRANTY; without even the implied warranty of    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the    GNU General Public License for more details.    You should have received a copy of the GNU General Public License    along with this program; if not, write to the Free Software    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. ****************************************************************************}unit aoptcpu;{$i fpcdefs.inc}interfaceuses cpubase, aasmtai, aopt, aoptcpub;type  TCpuAsmOptimizer = class(TAsmOptimizer)    function PeepHoleOptPass1Cpu(var p: tai): boolean; override;  end;implementationuses  globtype, globals,  cutils,  verbose,  cgbase, cgutils,  aoptobj,  aasmbase, aasmdata, aasmcpu,  itcpugas;function isFoldableArithOp(hp1: taicpu; reg: tregister): boolean;begin  isFoldableArithOp := False;  case hp1.opcode of    A_ADD, A_SUB, A_OR, A_XOR, A_AND, A_SHL, A_SHR, A_SAR:      isFoldableArithOp :=        (taicpu(hp1).oper[1]^.typ = top_reg) and        (taicpu(hp1).oper[1]^.reg = reg) and        ((taicpu(hp1).oper[0]^.typ = top_const) or        ((taicpu(hp1).oper[0]^.typ = top_reg) and        (taicpu(hp1).oper[0]^.reg<>reg)));    A_INC, A_DEC:      isFoldableArithOp :=        (taicpu(hp1).oper[0]^.typ = top_reg) and        (taicpu(hp1).oper[0]^.reg = reg);    end;end;function MatchInstruction(const instr: tai; const op: TAsmOp; const opsize: topsizes): boolean;  begin    result :=      (instr.typ = ait_instruction) and      (taicpu(instr).opcode = op) and      ((opsize = []) or (taicpu(instr).opsize in opsize));  end;function MatchInstruction(const instr: tai; const op1,op2: TAsmOp; const opsize: topsizes): boolean;  begin    result :=      (instr.typ = ait_instruction) and      ((taicpu(instr).opcode = op1) or       (taicpu(instr).opcode = op2)      ) and      ((opsize = []) or (taicpu(instr).opsize in opsize));  end;function MatchInstruction(const instr: tai; const op1,op2,op3: TAsmOp; const opsize: topsizes): boolean;  begin    result :=      (instr.typ = ait_instruction) and      ((taicpu(instr).opcode = op1) or       (taicpu(instr).opcode = op2) or       (taicpu(instr).opcode = op3)      ) and      ((opsize = []) or (taicpu(instr).opsize in opsize));  end;function MatchOperand(const oper: TOper; const reg: TRegister): boolean; inline;  begin    result := (oper.typ = top_reg) and (oper.reg = reg);  end;function MatchOperand(const oper: TOper; const a: tcgint): boolean; inline;  begin    result := (oper.typ = top_const) and (oper.val = a);  end;function refsequal(const r1, r2: treference): boolean;  begin    refsequal :=      (r1.offset = r2.offset) and      (r1.segment = r2.segment) and (r1.base = r2.base) and      (r1.index = r2.index) and (r1.scalefactor = r2.scalefactor) and      (r1.symbol=r2.symbol) and (r1.refaddr = r2.refaddr) and      (r1.relsymbol = r2.relsymbol);  end;function MatchOperand(const oper1: TOper; const oper2: TOper): boolean; inline;  begin    result := oper1.typ = oper2.typ;    if result then      case oper1.typ of        top_const:          Result:=oper1.val = oper2.val;        top_reg:          Result:=oper1.reg = oper2.reg;        top_ref:          Result:=RefsEqual(oper1.ref^, oper2.ref^);        else          internalerror(2013102801);      end  end;function MatchReference(const ref : treference;base,index : TRegister) : Boolean;  begin   Result:=(ref.offset=0) and     (ref.scalefactor in [0,1]) and     (ref.segment=NR_NO) and     (ref.symbol=nil) and     (ref.relsymbol=nil) and     ((base=NR_INVALID) or      (ref.base=base)) and     ((index=NR_INVALID) or      (ref.index=index));  end;function TCpuAsmOptimizer.PeepHoleOptPass1Cpu(var p: tai): boolean;var  next1: tai;  hp1, hp2: tai;  GetNextIntruction_p : boolean;  TmpUsedRegs : TAllUsedRegs;begin  Result := False;  case p.typ of    ait_instruction:      begin      case taicpu(p).opcode of        A_AND:          begin          if (taicpu(p).oper[0]^.typ = top_const) and            (taicpu(p).oper[1]^.typ = top_reg) and            GetNextInstruction(p, hp1) and            (tai(hp1).typ = ait_instruction) and            (taicpu(hp1).opcode = A_AND) and            (taicpu(hp1).oper[0]^.typ = top_const) and            (taicpu(hp1).oper[1]^.typ = top_reg) and            (getsupreg(taicpu(p).oper[1]^.reg) = getsupreg(            taicpu(hp1).oper[1]^.reg)) and            (getsubreg(taicpu(p).oper[1]^.reg)<=getsubreg(            taicpu(hp1).oper[1]^.reg)) and            (abs(taicpu(p).oper[0]^.val and             taicpu(hp1).oper[0]^.val)<$80000000) then            {change "and const1, reg; and const2, reg" to "and (const1 and const2), reg"}            begin              taicpu(hp1).loadConst(0, taicpu(p).oper[0]^.val and                taicpu(hp1).oper[0]^.val);              if (cs_asm_source in current_settings.globalswitches) then                asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var1')),p);              asml.remove(p);              p.Free;              p:=hp1;            end          else if (taicpu(p).oper[0]^.typ = top_const) and            (taicpu(p).oper[1]^.typ = top_reg) and            GetNextInstruction(p, hp1) and            MatchInstruction(hp1,A_MOVZX,[]) and            (taicpu(hp1).oper[0]^.typ = top_reg) and            MatchOperand(taicpu(p).oper[1]^,taicpu(hp1).oper[1]^) and            (getsubreg(taicpu(hp1).oper[0]^.reg)=getsubreg(taicpu(hp1).oper[1]^.reg)) and             (((taicpu(p).opsize=S_W) and               (taicpu(hp1).opsize=S_BW)) or              ((taicpu(p).opsize=S_L) and               (taicpu(hp1).opsize in [S_WL,S_BL])) or               ((taicpu(p).opsize=S_Q) and               (taicpu(hp1).opsize in [S_BQ,S_WQ,S_LQ]))              ) then                begin                  if (((taicpu(hp1).opsize) in [S_BW,S_BL,S_BQ]) and                      ((taicpu(p).oper[0]^.val and $ff)=taicpu(p).oper[0]^.val)) or                     (((taicpu(hp1).opsize) in [S_WL,S_WQ]) and                      ((taicpu(p).oper[0]^.val and $ffff)=taicpu(p).oper[0]^.val)) or                     (((taicpu(hp1).opsize)=S_LQ) and                      ((taicpu(p).oper[0]^.val and $ffffffff)=taicpu(p).oper[0]^.val)                     ) then                     begin                       if (cs_asm_source in current_settings.globalswitches) then                         asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,AndMovzToAnd')),p);                       asml.remove(hp1);                       hp1.free;                     end;                end          else if (taicpu(p).oper[0]^.typ = top_const) and            (taicpu(p).oper[1]^.typ = top_reg) and            GetNextInstruction(p, hp1) and            MatchInstruction(hp1,A_MOVSX,A_MOVSXD,[]) and            (taicpu(hp1).oper[0]^.typ = top_reg) and            MatchOperand(taicpu(p).oper[1]^,taicpu(hp1).oper[1]^) and            (getsupreg(taicpu(hp1).oper[0]^.reg)=getsupreg(taicpu(hp1).oper[1]^.reg)) and             (((taicpu(p).opsize=S_W) and               (taicpu(hp1).opsize=S_BW)) or              ((taicpu(p).opsize=S_L) and               (taicpu(hp1).opsize in [S_WL,S_BL])) or               ((taicpu(p).opsize=S_Q) and               (taicpu(hp1).opsize in [S_BQ,S_WQ,S_LQ]))              ) then                begin                  if (((taicpu(hp1).opsize) in [S_BW,S_BL,S_BQ]) and                      ((taicpu(p).oper[0]^.val and $7f)=taicpu(p).oper[0]^.val)) or                     (((taicpu(hp1).opsize) in [S_WL,S_WQ]) and                      ((taicpu(p).oper[0]^.val and $7fff)=taicpu(p).oper[0]^.val)) or                     (((taicpu(hp1).opsize)=S_LQ) and                      ((taicpu(p).oper[0]^.val and $7fffffff)=taicpu(p).oper[0]^.val)                     ) then                     begin                       if (cs_asm_source in current_settings.globalswitches) then                         asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,AndMovsxToAnd')),p);                       asml.remove(hp1);                       hp1.free;                     end;                end;(*                      else  {change "and x, reg; jxx" to "test x, reg", if reg is deallocated before the  jump, but only if it's a conditional jump (PFV) }                      if (taicpu(p).oper[1]^.typ = top_reg) and                         GetNextInstruction(p, hp1) and                         (hp1.typ = ait_instruction) and                         (taicpu(hp1).is_jmp) and                         (taicpu(hp1).opcode<>A_JMP) and                         not(getsupreg(taicpu(p).oper[1]^.reg) in UsedRegs) then                        taicpu(p).opcode := A_TEST;*)          end;        A_MOV:        { removes superfluous And's after mov's }          begin            if not(cs_opt_level3 in current_settings.optimizerswitches) then              exit;            GetNextIntruction_p:=GetNextInstruction(p, hp1);            if (taicpu(p).oper[1]^.typ = top_reg) and               GetNextIntruction_p and               (tai(hp1).typ = ait_instruction) and               (taicpu(hp1).opcode = A_AND) and               (taicpu(hp1).oper[0]^.typ = top_const) and               (taicpu(hp1).oper[1]^.typ = top_reg) and               (taicpu(hp1).oper[1]^.reg = taicpu(p).oper[1]^.reg) then              case taicpu(p).opsize Of                S_L:                  if (taicpu(hp1).oper[0]^.val = $ffffffff) then                    begin                      if (cs_asm_source in current_settings.globalswitches) then                        asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var2a')),p);                      asml.remove(hp1);                      hp1.free;                    end;              end            { Next instruction is also a MOV ? }            else if GetNextIntruction_p and              MatchInstruction(hp1,A_MOV,[taicpu(p).opsize]) then              begin                if (taicpu(hp1).oper[0]^.typ = taicpu(p).oper[1]^.typ) and                   (taicpu(hp1).oper[1]^.typ = taicpu(p).oper[0]^.typ) then                    {mov reg1, mem1     or     mov mem1, reg1                     mov mem2, reg2            mov reg2, mem2}                  begin                    if OpsEqual(taicpu(hp1).oper[1]^,taicpu(p).oper[0]^) then                      {mov reg1, mem1     or     mov mem1, reg1                       mov mem2, reg1            mov reg2, mem1}                      begin                        if OpsEqual(taicpu(hp1).oper[0]^,taicpu(p).oper[1]^) then                          { Removes the second statement from                            mov reg1, mem1/reg2                            mov mem1/reg2, reg1 }                          begin                            { if (taicpu(p).oper[0]^.typ = top_reg) then                              AllocRegBetween(asmL,taicpu(p).oper[0]^.reg,p,hp1,usedregs); }                            if (cs_asm_source in current_settings.globalswitches) then                              asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,MovMov2Mov1')),p);                            asml.remove(hp1);                            hp1.free;                          end;                      end                    else if (taicpu(p).oper[1]^.typ=top_ref) and                      OpsEqual(taicpu(hp1).oper[0]^,taicpu(p).oper[1]^) then                      begin                        taicpu(hp1).loadreg(0,taicpu(p).oper[0]^.reg);                        if (cs_asm_source in current_settings.globalswitches) then                          asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,MovMov2MovMov1')),p);                      end;                  end              end            else if (taicpu(p).oper[1]^.typ = top_reg) and              GetNextIntruction_p and              (hp1.typ = ait_instruction) and              GetNextInstruction(hp1, hp2) and              (hp2.typ = ait_instruction) and              (taicpu(hp2).opcode = A_MOV) and              (taicpu(hp2).oper[0]^.typ = top_reg) and              OpsEqual(taicpu(hp2).oper[1]^, taicpu(p).oper[0]^) and              (IsFoldableArithOp(taicpu(hp1), taicpu(p).oper[1]^.reg) or               ((taicpu(p).opsize=S_L) and (taicpu(hp1).opsize=S_Q) and                IsFoldableArithOp(taicpu(hp1), newreg(R_INTREGISTER,getsupreg(taicpu(p).oper[1]^.reg),R_SUBQ)))              ) then              { change   movsX/movzX    reg/ref, reg2             }              {          add/sub/or/... reg3/$const, reg2         }              {          mov            reg2 reg/ref              }              { to       add/sub/or/... reg3/$const, reg/ref      }              begin                CopyUsedRegs(TmpUsedRegs);                UpdateUsedRegs(TmpUsedRegs, tai(p.next));                UpdateUsedRegs(TmpUsedRegs, tai(hp1.next));                If not(RegUsedAfterInstruction(taicpu(p).oper[1]^.reg,hp2,TmpUsedRegs)) then                  begin                    { by example:                        movswl  %si,%eax        movswl  %si,%eax      p                        decl    %eax            addl    %edx,%eax     hp1                        movw    %ax,%si         movw    %ax,%si       hp2                      ->                        movswl  %si,%eax        movswl  %si,%eax      p                        decw    %eax            addw    %edx,%eax     hp1                        movw    %ax,%si         movw    %ax,%si       hp2                    }                    if (cs_asm_source in current_settings.globalswitches) then                      begin                        asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var2')),p);                        asml.insertbefore(tai_comment.create(strpnew('P='+std_op2str[taicpu(p).opcode]+gas_opsize2str[taicpu(p).opsize])),p);                        asml.insertbefore(tai_comment.create(strpnew('HP1='+std_op2str[taicpu(hp1).opcode]+gas_opsize2str[taicpu(hp1).opsize])),p);                        asml.insertbefore(tai_comment.create(strpnew('HP2='+std_op2str[taicpu(hp2).opcode]+gas_opsize2str[taicpu(hp2).opsize])),p);                     end;                    taicpu(hp1).changeopsize(taicpu(p).opsize);                    {                      ->                        movswl  %si,%eax        movswl  %si,%eax      p                        decw    %si             addw    %dx,%si       hp1                        movw    %ax,%si         movw    %ax,%si       hp2                    }                    case taicpu(hp1).ops of                      1:                        begin                          taicpu(hp1).loadoper(0, taicpu(hp2).oper[1]^);                          if taicpu(hp1).oper[0]^.typ=top_reg then                            setsubreg(taicpu(hp1).oper[0]^.reg,getsubreg(taicpu(p).oper[1]^.reg));                        end;                      2:                        begin                          taicpu(hp1).loadoper(1, taicpu(hp2).oper[1]^);                          if (taicpu(hp1).oper[0]^.typ=top_reg) and                            (taicpu(hp1).opcode<>A_SHL) and                            (taicpu(hp1).opcode<>A_SHR) and                            (taicpu(hp1).opcode<>A_SAR) then                            setsubreg(taicpu(hp1).oper[0]^.reg,getsubreg(taicpu(p).oper[1]^.reg));                        end;                      else                        internalerror(2008042701);                    end;                    {                      ->                        decw    %si             addw    %dx,%si       p                    }                    if (cs_asm_source in current_settings.globalswitches) then                      asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var2')),p);                    asml.remove(p);                    asml.remove(hp2);                    p.Free;                    hp2.Free;                    p := hp1;                 end;                ReleaseUsedRegs(TmpUsedRegs);              end          end;        A_MOVSX,        A_MOVZX:          begin          if (taicpu(p).oper[1]^.typ = top_reg) and            GetNextInstruction(p, hp1) and            (hp1.typ = ait_instruction) and            IsFoldableArithOp(taicpu(hp1), taicpu(p).oper[1]^.reg) and            GetNextInstruction(hp1, hp2) and            (hp2.typ = ait_instruction) and            (taicpu(hp2).opcode = A_MOV) and            (taicpu(hp2).oper[0]^.typ = top_reg) and            OpsEqual(taicpu(hp2).oper[1]^, taicpu(p).oper[0]^) then            { change   movsX/movzX    reg/ref, reg2             }            {          add/sub/or/... reg3/$const, reg2         }            {          mov            reg2 reg/ref              }            { to       add/sub/or/... reg3/$const, reg/ref      }            begin              { by example:                  movswl  %si,%eax        movswl  %si,%eax      p                  decl    %eax            addl    %edx,%eax     hp1                  movw    %ax,%si         movw    %ax,%si       hp2                ->                  movswl  %si,%eax        movswl  %si,%eax      p                  decw    %eax            addw    %edx,%eax     hp1                  movw    %ax,%si         movw    %ax,%si       hp2              }              taicpu(hp1).changeopsize(taicpu(hp2).opsize);              {                ->                  movswl  %si,%eax        movswl  %si,%eax      p                  decw    %si             addw    %dx,%si       hp1                  movw    %ax,%si         movw    %ax,%si       hp2              }              case taicpu(hp1).ops of                1:                  taicpu(hp1).loadoper(0, taicpu(hp2).oper[1]^);                2:                  begin                    taicpu(hp1).loadoper(1, taicpu(hp2).oper[1]^);                    if (taicpu(hp1).oper[0]^.typ = top_reg) then                      setsubreg(taicpu(hp1).oper[0]^.reg,                        getsubreg(taicpu(hp2).oper[0]^.reg));                  end;                else                  internalerror(2008042701);              end;              {                ->                  decw    %si             addw    %dx,%si       p              }              if (cs_asm_source in current_settings.globalswitches) then                asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var3')),p);              asml.remove(p);              asml.remove(hp2);              p.Free;              hp2.Free;              p := hp1;            end          { removes superfluous And's after movzx's }          else if taicpu(p).opcode = A_MOVZX then            begin            if (taicpu(p).oper[1]^.typ = top_reg) and              GetNextInstruction(p, hp1) and              (tai(hp1).typ = ait_instruction) and              (taicpu(hp1).opcode = A_AND) and              (taicpu(hp1).oper[0]^.typ = top_const) and              (taicpu(hp1).oper[1]^.typ = top_reg) and              (taicpu(hp1).oper[1]^.reg = taicpu(p).oper[1]^.reg) then                begin                  case taicpu(p).opsize of                    S_BL, S_BW, S_BQ:                      if (taicpu(hp1).oper[0]^.val = $ff) then                        begin                          if (cs_asm_source in current_settings.globalswitches) then                            asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var4')),p);                          asml.remove(hp1);                          hp1.Free;                        end;                    S_WL, S_WQ:                      if (taicpu(hp1).oper[0]^.val = $ffff) then                        begin                          if (cs_asm_source in current_settings.globalswitches) then                            asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var5')),p);                          asml.remove(hp1);                          hp1.Free;                        end;                    S_LQ:                      if (taicpu(hp1).oper[0]^.val = $ffffffff) then                        begin                          if (cs_asm_source in current_settings.globalswitches) then                            asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var6')),p);                          asml.remove(hp1);                          hp1.Free;                        end;                    end;               end;            { changes some movzx constructs to faster synonims (all examples              are given with eax/ax, but are also valid for other registers)}            if (taicpu(p).oper[1]^.typ = top_reg) then              if (taicpu(p).oper[0]^.typ = top_reg) then                case taicpu(p).opsize of                  S_BW:                    begin                    if (getsupreg(taicpu(p).oper[0]^.reg) =                      getsupreg(taicpu(p).oper[1]^.reg)) and  not                      (cs_opt_size in current_settings.optimizerswitches) then                      {Change "movzbw %al, %ax" to "andw $0x0ffh, %ax"}                      begin                      taicpu(p).opcode := A_AND;                      taicpu(p).changeopsize(S_W);                      taicpu(p).loadConst(0, $ff);                      if (cs_asm_source in current_settings.globalswitches) then                        asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var7')),p);                      end                    else if GetNextInstruction(p, hp1) and                      (tai(hp1).typ = ait_instruction) and                      (taicpu(hp1).opcode = A_AND) and                      (taicpu(hp1).oper[0]^.typ = top_const) and                      (taicpu(hp1).oper[1]^.typ = top_reg) and                      (taicpu(hp1).oper[1]^.reg =                      taicpu(p).oper[1]^.reg) then                      { Change "movzbw %reg1, %reg2; andw $const, %reg2"                        to "movw %reg1, reg2; andw $(const1 and $ff), %reg2"}                      begin                        if (cs_asm_source in current_settings.globalswitches) then                          asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var8')),p);                        taicpu(p).opcode := A_MOV;                        taicpu(p).changeopsize(S_W);                        setsubreg(taicpu(p).oper[0]^.reg, R_SUBW);                        taicpu(hp1).loadConst(                          0, taicpu(hp1).oper[0]^.val and $ff);                      end;                    end;                  S_BL:                    begin                    if (getsupreg(taicpu(p).oper[0]^.reg) =                      getsupreg(taicpu(p).oper[1]^.reg)) and not                      (cs_opt_size in current_settings.optimizerswitches) then                      { Change "movzbl %al, %eax" to "andl $0x0ffh, %eax"}                      begin                        if (cs_asm_source in current_settings.globalswitches) then                          asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var9')),p);                        taicpu(p).opcode := A_AND;                        taicpu(p).changeopsize(S_L);                        taicpu(p).loadConst(0, $ff);                      end                    else if GetNextInstruction(p, hp1) and                      (tai(hp1).typ = ait_instruction) and                      (taicpu(hp1).opcode = A_AND) and                      (taicpu(hp1).oper[0]^.typ = top_const) and                      (taicpu(hp1).oper[1]^.typ = top_reg) and                      (taicpu(hp1).oper[1]^.reg =                      taicpu(p).oper[1]^.reg) then                      { Change "movzbl %reg1, %reg2; andl $const, %reg2"                        to "movl %reg1, reg2; andl $(const1 and $ff), %reg2"}                      begin                        if (cs_asm_source in current_settings.globalswitches) then                          asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var10')),p);                        taicpu(p).opcode := A_MOV;                        taicpu(p).changeopsize(S_L);                        { do not use R_SUBWHOLE                          as movl %rdx,%eax                          is invalid in assembler PM }                        setsubreg(taicpu(p).oper[0]^.reg, R_SUBD);                        taicpu(hp1).loadConst(                          0, taicpu(hp1).oper[0]^.val and $ff);                      end;                    end;                  S_WL:                    begin                    if (getsupreg(taicpu(p).oper[0]^.reg) =                      getsupreg(taicpu(p).oper[1]^.reg)) and  not                      (cs_opt_size in current_settings.optimizerswitches) then                      { Change "movzwl %ax, %eax" to "andl $0x0ffffh, %eax" }                      begin                        if (cs_asm_source in current_settings.globalswitches) then                          asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var11')),p);                        taicpu(p).opcode := A_AND;                        taicpu(p).changeopsize(S_L);                        taicpu(p).loadConst(0, $ffff);                      end                    else if GetNextInstruction(p, hp1) and                      (tai(hp1).typ = ait_instruction) and                      (taicpu(hp1).opcode = A_AND) and                      (taicpu(hp1).oper[0]^.typ = top_const) and                      (taicpu(hp1).oper[1]^.typ = top_reg) and                      (taicpu(hp1).oper[1]^.reg =                      taicpu(p).oper[1]^.reg) then                      { Change "movzwl %reg1, %reg2; andl $const, %reg2"                        to "movl %reg1, reg2; andl $(const1 and $ffff), %reg2"}                      begin                        if (cs_asm_source in current_settings.globalswitches) then                          asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var12')),p);                        taicpu(p).opcode := A_MOV;                        taicpu(p).changeopsize(S_L);                        { do not use R_SUBWHOLE                          as movl %rdx,%eax                          is invalid in assembler PM }                        setsubreg(taicpu(p).oper[0]^.reg, R_SUBD);                        taicpu(hp1).loadConst(                          0, taicpu(hp1).oper[0]^.val and $ffff);                      end;                    end;                  end              else if (taicpu(p).oper[0]^.typ = top_ref) then                begin                if GetNextInstruction(p, hp1) and                  (tai(hp1).typ = ait_instruction) and                  (taicpu(hp1).opcode = A_AND) and                  (taicpu(hp1).oper[0]^.typ = Top_Const) and                  (taicpu(hp1).oper[1]^.typ = Top_Reg) and                  (taicpu(hp1).oper[1]^.reg =                  taicpu(p).oper[1]^.reg) then                  begin                  taicpu(p).opcode := A_MOV;                  case taicpu(p).opsize of                    S_BL:                      begin                        if (cs_asm_source in current_settings.globalswitches) then                          asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var13')),p);                        taicpu(p).changeopsize(S_L);                        taicpu(hp1).loadConst(                          0, taicpu(hp1).oper[0]^.val and $ff);                      end;                    S_WL:                      begin                        if (cs_asm_source in current_settings.globalswitches) then                          asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var14')),p);                        taicpu(p).changeopsize(S_L);                        taicpu(hp1).loadConst(                          0, taicpu(hp1).oper[0]^.val and $ffff);                      end;                    S_BW:                      begin                        if (cs_asm_source in current_settings.globalswitches) then                          asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var15')),p);                        taicpu(p).changeopsize(S_W);                        taicpu(hp1).loadConst(                          0, taicpu(hp1).oper[0]^.val and $ff);                      end;                    S_BQ:                      begin                        if (cs_asm_source in current_settings.globalswitches) then                          asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var16')),p);                        taicpu(p).changeopsize(S_Q);                        taicpu(hp1).loadConst(                          0, taicpu(hp1).oper[0]^.val and $ff);                      end;                    S_WQ:                      begin                        if (cs_asm_source in current_settings.globalswitches) then                          asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var17')),p);                        taicpu(p).changeopsize(S_Q);                        taicpu(hp1).loadConst(                          0, taicpu(hp1).oper[0]^.val and $ffff);                      end;                    S_LQ:                      begin                        if (cs_asm_source in current_settings.globalswitches) then                          asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var18')),p);                        taicpu(p).changeopsize(S_Q);                        taicpu(hp1).loadConst(                          0, taicpu(hp1).oper[0]^.val and $ffffffff);                      end;                    end;                  end;                end;            end;          end;        A_VDIVSD,        A_VDIVSS,        A_VSUBSD,        A_VSUBSS,        A_VMULSD,        A_VMULSS,        A_VADDSD,        A_VADDSS:          begin            if GetNextInstruction(p,hp1) and              { we mix single and double opperations here because we assume that the compiler                generates vmovapd only after double operations and vmovaps only after single operations }              MatchInstruction(hp1,A_VMOVAPD,A_VMOVAPS,[S_NO]) and              MatchOperand(taicpu(p).oper[2]^,taicpu(hp1).oper[0]^) and              (taicpu(hp1).oper[1]^.typ=top_reg) then              begin                CopyUsedRegs(TmpUsedRegs);                UpdateUsedRegs(TmpUsedRegs, tai(p.next));                If not(RegUsedAfterInstruction(taicpu(hp1).oper[0]^.reg,hp1,TmpUsedRegs)) then                  begin                    taicpu(p).loadoper(2,taicpu(hp1).oper[1]^);                    asml.Remove(hp1);                    hp1.Free;                  end;              end;          end;        end;      end;    end;end;begin  casmoptimizer := TCpuAsmOptimizer;end.
 |