123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632 |
- {
- Copyright (c) 1998-2004 by Jonas Maebe
- This unit calls the optimization procedures to optimize the assembler
- code for sparc
- This program is free software; you can redistribute it and/or modify
- it under the terms of the GNU General Public License as published by
- the Free Software Foundation; either version 2 of the License, or
- (at your option) any later version.
- This program is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- GNU General Public License for more details.
- You should have received a copy of the GNU General Public License
- along with this program; if not, write to the Free Software
- Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
- ****************************************************************************
- }
- unit aoptcpu;
- {$i fpcdefs.inc}
- interface
- uses cgbase, cpubase, aasmtai, aopt, aoptx86, aoptcpub;
- type
- TCpuAsmOptimizer = class(TX86AsmOptimizer)
- function PeepHoleOptPass1Cpu(var p: tai): boolean; override;
- function PostPeepHoleOptsCpu(var p : tai) : boolean; override;
- end;
- implementation
- uses
- globtype, globals,
- cutils,
- verbose,
- cgutils,
- aoptobj,
- aasmbase, aasmdata, aasmcpu,
- itcpugas;
- function isFoldableArithOp(hp1: taicpu; reg: tregister): boolean;
- begin
- isFoldableArithOp := False;
- case hp1.opcode of
- A_ADD, A_SUB, A_OR, A_XOR, A_AND, A_SHL, A_SHR, A_SAR:
- isFoldableArithOp :=
- (taicpu(hp1).oper[1]^.typ = top_reg) and
- (taicpu(hp1).oper[1]^.reg = reg) and
- ((taicpu(hp1).oper[0]^.typ = top_const) or
- ((taicpu(hp1).oper[0]^.typ = top_reg) and
- (taicpu(hp1).oper[0]^.reg<>reg)));
- A_INC, A_DEC:
- isFoldableArithOp :=
- (taicpu(hp1).oper[0]^.typ = top_reg) and
- (taicpu(hp1).oper[0]^.reg = reg);
- end;
- end;
- function TCpuAsmOptimizer.PeepHoleOptPass1Cpu(var p: tai): boolean;
- var
- hp1, hp2: tai;
- GetNextIntruction_p : boolean;
- TmpUsedRegs : TAllUsedRegs;
- begin
- Result := False;
- case p.typ of
- ait_instruction:
- begin
- case taicpu(p).opcode of
- A_AND:
- begin
- if (taicpu(p).oper[0]^.typ = top_const) and
- (taicpu(p).oper[1]^.typ = top_reg) and
- GetNextInstruction(p, hp1) and
- (tai(hp1).typ = ait_instruction) and
- (taicpu(hp1).opcode = A_AND) and
- (taicpu(hp1).oper[0]^.typ = top_const) and
- (taicpu(hp1).oper[1]^.typ = top_reg) and
- (getsupreg(taicpu(p).oper[1]^.reg) = getsupreg(
- taicpu(hp1).oper[1]^.reg)) and
- (getsubreg(taicpu(p).oper[1]^.reg)<=getsubreg(
- taicpu(hp1).oper[1]^.reg)) and
- (abs(taicpu(p).oper[0]^.val and
- taicpu(hp1).oper[0]^.val)<$80000000) then
- {change "and const1, reg; and const2, reg" to "and (const1 and const2), reg"}
- begin
- taicpu(hp1).loadConst(0, taicpu(p).oper[0]^.val and
- taicpu(hp1).oper[0]^.val);
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var1')),p);
- asml.remove(p);
- p.Free;
- p:=hp1;
- end
- else if (taicpu(p).oper[0]^.typ = top_const) and
- (taicpu(p).oper[1]^.typ = top_reg) and
- GetNextInstruction(p, hp1) and
- MatchInstruction(hp1,A_MOVZX,[]) and
- (taicpu(hp1).oper[0]^.typ = top_reg) and
- MatchOperand(taicpu(p).oper[1]^,taicpu(hp1).oper[1]^) and
- (getsubreg(taicpu(hp1).oper[0]^.reg)=getsubreg(taicpu(hp1).oper[1]^.reg)) and
- (((taicpu(p).opsize=S_W) and
- (taicpu(hp1).opsize=S_BW)) or
- ((taicpu(p).opsize=S_L) and
- (taicpu(hp1).opsize in [S_WL,S_BL])) or
- ((taicpu(p).opsize=S_Q) and
- (taicpu(hp1).opsize in [S_BQ,S_WQ,S_LQ]))
- ) then
- begin
- if (((taicpu(hp1).opsize) in [S_BW,S_BL,S_BQ]) and
- ((taicpu(p).oper[0]^.val and $ff)=taicpu(p).oper[0]^.val)) or
- (((taicpu(hp1).opsize) in [S_WL,S_WQ]) and
- ((taicpu(p).oper[0]^.val and $ffff)=taicpu(p).oper[0]^.val)) or
- (((taicpu(hp1).opsize)=S_LQ) and
- ((taicpu(p).oper[0]^.val and $ffffffff)=taicpu(p).oper[0]^.val)
- ) then
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,AndMovzToAnd')),p);
- asml.remove(hp1);
- hp1.free;
- end;
- end
- else if (taicpu(p).oper[0]^.typ = top_const) and
- (taicpu(p).oper[1]^.typ = top_reg) and
- GetNextInstruction(p, hp1) and
- MatchInstruction(hp1,A_MOVSX,A_MOVSXD,[]) and
- (taicpu(hp1).oper[0]^.typ = top_reg) and
- MatchOperand(taicpu(p).oper[1]^,taicpu(hp1).oper[1]^) and
- (getsupreg(taicpu(hp1).oper[0]^.reg)=getsupreg(taicpu(hp1).oper[1]^.reg)) and
- (((taicpu(p).opsize=S_W) and
- (taicpu(hp1).opsize=S_BW)) or
- ((taicpu(p).opsize=S_L) and
- (taicpu(hp1).opsize in [S_WL,S_BL])) or
- ((taicpu(p).opsize=S_Q) and
- (taicpu(hp1).opsize in [S_BQ,S_WQ,S_LQ]))
- ) then
- begin
- if (((taicpu(hp1).opsize) in [S_BW,S_BL,S_BQ]) and
- ((taicpu(p).oper[0]^.val and $7f)=taicpu(p).oper[0]^.val)) or
- (((taicpu(hp1).opsize) in [S_WL,S_WQ]) and
- ((taicpu(p).oper[0]^.val and $7fff)=taicpu(p).oper[0]^.val)) or
- (((taicpu(hp1).opsize)=S_LQ) and
- ((taicpu(p).oper[0]^.val and $7fffffff)=taicpu(p).oper[0]^.val)
- ) then
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,AndMovsxToAnd')),p);
- asml.remove(hp1);
- hp1.free;
- end;
- end;
- (* else
- {change "and x, reg; jxx" to "test x, reg", if reg is deallocated before the
- jump, but only if it's a conditional jump (PFV) }
- if (taicpu(p).oper[1]^.typ = top_reg) and
- GetNextInstruction(p, hp1) and
- (hp1.typ = ait_instruction) and
- (taicpu(hp1).is_jmp) and
- (taicpu(hp1).opcode<>A_JMP) and
- not(getsupreg(taicpu(p).oper[1]^.reg) in UsedRegs) then
- taicpu(p).opcode := A_TEST;*)
- end;
- A_MOV:
- { removes superfluous And's after mov's }
- begin
- if not(cs_opt_level3 in current_settings.optimizerswitches) then
- exit;
- GetNextIntruction_p:=GetNextInstruction(p, hp1);
- if (taicpu(p).oper[1]^.typ = top_reg) and
- GetNextIntruction_p and
- (tai(hp1).typ = ait_instruction) and
- (taicpu(hp1).opcode = A_AND) and
- (taicpu(hp1).oper[0]^.typ = top_const) and
- (taicpu(hp1).oper[1]^.typ = top_reg) and
- (taicpu(hp1).oper[1]^.reg = taicpu(p).oper[1]^.reg) then
- case taicpu(p).opsize Of
- S_L:
- if (taicpu(hp1).oper[0]^.val = $ffffffff) then
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var2a')),p);
- asml.remove(hp1);
- hp1.free;
- end;
- end
- { Next instruction is also a MOV ? }
- else if GetNextIntruction_p and
- MatchInstruction(hp1,A_MOV,[taicpu(p).opsize]) then
- begin
- if (taicpu(hp1).oper[0]^.typ = taicpu(p).oper[1]^.typ) and
- (taicpu(hp1).oper[1]^.typ = taicpu(p).oper[0]^.typ) then
- {mov reg1, mem1 or mov mem1, reg1
- mov mem2, reg2 mov reg2, mem2}
- begin
- if OpsEqual(taicpu(hp1).oper[1]^,taicpu(p).oper[0]^) then
- {mov reg1, mem1 or mov mem1, reg1
- mov mem2, reg1 mov reg2, mem1}
- begin
- if OpsEqual(taicpu(hp1).oper[0]^,taicpu(p).oper[1]^) then
- { Removes the second statement from
- mov reg1, mem1/reg2
- mov mem1/reg2, reg1 }
- begin
- { if (taicpu(p).oper[0]^.typ = top_reg) then
- AllocRegBetween(asmL,taicpu(p).oper[0]^.reg,p,hp1,usedregs); }
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,MovMov2Mov1')),p);
- asml.remove(hp1);
- hp1.free;
- end;
- end
- else if (taicpu(p).oper[1]^.typ=top_ref) and
- OpsEqual(taicpu(hp1).oper[0]^,taicpu(p).oper[1]^) then
- begin
- taicpu(hp1).loadreg(0,taicpu(p).oper[0]^.reg);
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,MovMov2MovMov1')),p);
- end;
- end
- end
- else if (taicpu(p).oper[1]^.typ = top_reg) and
- GetNextIntruction_p and
- (hp1.typ = ait_instruction) and
- GetNextInstruction(hp1, hp2) and
- (hp2.typ = ait_instruction) and
- (taicpu(hp2).opcode = A_MOV) and
- (taicpu(hp2).oper[0]^.typ = top_reg) and
- OpsEqual(taicpu(hp2).oper[1]^, taicpu(p).oper[0]^) and
- (IsFoldableArithOp(taicpu(hp1), taicpu(p).oper[1]^.reg) or
- ((taicpu(p).opsize=S_L) and (taicpu(hp1).opsize=S_Q) and
- IsFoldableArithOp(taicpu(hp1), newreg(R_INTREGISTER,getsupreg(taicpu(p).oper[1]^.reg),R_SUBQ)))
- ) then
- { change movsX/movzX reg/ref, reg2 }
- { add/sub/or/... reg3/$const, reg2 }
- { mov reg2 reg/ref }
- { to add/sub/or/... reg3/$const, reg/ref }
- begin
- CopyUsedRegs(TmpUsedRegs);
- UpdateUsedRegs(TmpUsedRegs, tai(p.next));
- UpdateUsedRegs(TmpUsedRegs, tai(hp1.next));
- If not(RegUsedAfterInstruction(taicpu(p).oper[1]^.reg,hp2,TmpUsedRegs)) then
- begin
- { by example:
- movswl %si,%eax movswl %si,%eax p
- decl %eax addl %edx,%eax hp1
- movw %ax,%si movw %ax,%si hp2
- ->
- movswl %si,%eax movswl %si,%eax p
- decw %eax addw %edx,%eax hp1
- movw %ax,%si movw %ax,%si hp2
- }
- if (cs_asm_source in current_settings.globalswitches) then
- begin
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var2')),p);
- asml.insertbefore(tai_comment.create(strpnew('P='+std_op2str[taicpu(p).opcode]+gas_opsize2str[taicpu(p).opsize])),p);
- asml.insertbefore(tai_comment.create(strpnew('HP1='+std_op2str[taicpu(hp1).opcode]+gas_opsize2str[taicpu(hp1).opsize])),p);
- asml.insertbefore(tai_comment.create(strpnew('HP2='+std_op2str[taicpu(hp2).opcode]+gas_opsize2str[taicpu(hp2).opsize])),p);
- end;
- taicpu(hp1).changeopsize(taicpu(p).opsize);
- {
- ->
- movswl %si,%eax movswl %si,%eax p
- decw %si addw %dx,%si hp1
- movw %ax,%si movw %ax,%si hp2
- }
- case taicpu(hp1).ops of
- 1:
- begin
- taicpu(hp1).loadoper(0, taicpu(hp2).oper[1]^);
- if taicpu(hp1).oper[0]^.typ=top_reg then
- setsubreg(taicpu(hp1).oper[0]^.reg,getsubreg(taicpu(p).oper[1]^.reg));
- end;
- 2:
- begin
- taicpu(hp1).loadoper(1, taicpu(hp2).oper[1]^);
- if (taicpu(hp1).oper[0]^.typ=top_reg) and
- (taicpu(hp1).opcode<>A_SHL) and
- (taicpu(hp1).opcode<>A_SHR) and
- (taicpu(hp1).opcode<>A_SAR) then
- setsubreg(taicpu(hp1).oper[0]^.reg,getsubreg(taicpu(p).oper[1]^.reg));
- end;
- else
- internalerror(2008042701);
- end;
- {
- ->
- decw %si addw %dx,%si p
- }
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var2')),p);
- asml.remove(p);
- asml.remove(hp2);
- p.Free;
- hp2.Free;
- p := hp1;
- end;
- ReleaseUsedRegs(TmpUsedRegs);
- end
- end;
- A_MOVSX,
- A_MOVZX:
- begin
- if (taicpu(p).oper[1]^.typ = top_reg) and
- GetNextInstruction(p, hp1) and
- (hp1.typ = ait_instruction) and
- IsFoldableArithOp(taicpu(hp1), taicpu(p).oper[1]^.reg) and
- GetNextInstruction(hp1, hp2) and
- (hp2.typ = ait_instruction) and
- (taicpu(hp2).opcode = A_MOV) and
- (taicpu(hp2).oper[0]^.typ = top_reg) and
- OpsEqual(taicpu(hp2).oper[1]^, taicpu(p).oper[0]^) then
- { change movsX/movzX reg/ref, reg2 }
- { add/sub/or/... reg3/$const, reg2 }
- { mov reg2 reg/ref }
- { to add/sub/or/... reg3/$const, reg/ref }
- begin
- { by example:
- movswl %si,%eax movswl %si,%eax p
- decl %eax addl %edx,%eax hp1
- movw %ax,%si movw %ax,%si hp2
- ->
- movswl %si,%eax movswl %si,%eax p
- decw %eax addw %edx,%eax hp1
- movw %ax,%si movw %ax,%si hp2
- }
- taicpu(hp1).changeopsize(taicpu(hp2).opsize);
- {
- ->
- movswl %si,%eax movswl %si,%eax p
- decw %si addw %dx,%si hp1
- movw %ax,%si movw %ax,%si hp2
- }
- case taicpu(hp1).ops of
- 1:
- taicpu(hp1).loadoper(0, taicpu(hp2).oper[1]^);
- 2:
- begin
- taicpu(hp1).loadoper(1, taicpu(hp2).oper[1]^);
- if (taicpu(hp1).oper[0]^.typ = top_reg) then
- setsubreg(taicpu(hp1).oper[0]^.reg,
- getsubreg(taicpu(hp2).oper[0]^.reg));
- end;
- else
- internalerror(2008042701);
- end;
- {
- ->
- decw %si addw %dx,%si p
- }
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var3')),p);
- asml.remove(p);
- asml.remove(hp2);
- p.Free;
- hp2.Free;
- p := hp1;
- end
- { removes superfluous And's after movzx's }
- else if taicpu(p).opcode = A_MOVZX then
- begin
- if (taicpu(p).oper[1]^.typ = top_reg) and
- GetNextInstruction(p, hp1) and
- (tai(hp1).typ = ait_instruction) and
- (taicpu(hp1).opcode = A_AND) and
- (taicpu(hp1).oper[0]^.typ = top_const) and
- (taicpu(hp1).oper[1]^.typ = top_reg) and
- (taicpu(hp1).oper[1]^.reg = taicpu(p).oper[1]^.reg) then
- begin
- case taicpu(p).opsize of
- S_BL, S_BW, S_BQ:
- if (taicpu(hp1).oper[0]^.val = $ff) then
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var4')),p);
- asml.remove(hp1);
- hp1.Free;
- end;
- S_WL, S_WQ:
- if (taicpu(hp1).oper[0]^.val = $ffff) then
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var5')),p);
- asml.remove(hp1);
- hp1.Free;
- end;
- S_LQ:
- if (taicpu(hp1).oper[0]^.val = $ffffffff) then
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var6')),p);
- asml.remove(hp1);
- hp1.Free;
- end;
- end;
- end;
- { changes some movzx constructs to faster synonims (all examples
- are given with eax/ax, but are also valid for other registers)}
- if (taicpu(p).oper[1]^.typ = top_reg) then
- if (taicpu(p).oper[0]^.typ = top_reg) then
- case taicpu(p).opsize of
- S_BW:
- begin
- if (getsupreg(taicpu(p).oper[0]^.reg) =
- getsupreg(taicpu(p).oper[1]^.reg)) and not
- (cs_opt_size in current_settings.optimizerswitches) then
- {Change "movzbw %al, %ax" to "andw $0x0ffh, %ax"}
- begin
- taicpu(p).opcode := A_AND;
- taicpu(p).changeopsize(S_W);
- taicpu(p).loadConst(0, $ff);
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var7')),p);
- end
- else if GetNextInstruction(p, hp1) and
- (tai(hp1).typ = ait_instruction) and
- (taicpu(hp1).opcode = A_AND) and
- (taicpu(hp1).oper[0]^.typ = top_const) and
- (taicpu(hp1).oper[1]^.typ = top_reg) and
- (taicpu(hp1).oper[1]^.reg =
- taicpu(p).oper[1]^.reg) then
- { Change "movzbw %reg1, %reg2; andw $const, %reg2"
- to "movw %reg1, reg2; andw $(const1 and $ff), %reg2"}
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var8')),p);
- taicpu(p).opcode := A_MOV;
- taicpu(p).changeopsize(S_W);
- setsubreg(taicpu(p).oper[0]^.reg, R_SUBW);
- taicpu(hp1).loadConst(
- 0, taicpu(hp1).oper[0]^.val and $ff);
- end;
- end;
- S_BL:
- begin
- if (getsupreg(taicpu(p).oper[0]^.reg) =
- getsupreg(taicpu(p).oper[1]^.reg)) and not
- (cs_opt_size in current_settings.optimizerswitches) then
- { Change "movzbl %al, %eax" to "andl $0x0ffh, %eax"}
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var9')),p);
- taicpu(p).opcode := A_AND;
- taicpu(p).changeopsize(S_L);
- taicpu(p).loadConst(0, $ff);
- end
- else if GetNextInstruction(p, hp1) and
- (tai(hp1).typ = ait_instruction) and
- (taicpu(hp1).opcode = A_AND) and
- (taicpu(hp1).oper[0]^.typ = top_const) and
- (taicpu(hp1).oper[1]^.typ = top_reg) and
- (taicpu(hp1).oper[1]^.reg =
- taicpu(p).oper[1]^.reg) then
- { Change "movzbl %reg1, %reg2; andl $const, %reg2"
- to "movl %reg1, reg2; andl $(const1 and $ff), %reg2"}
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var10')),p);
- taicpu(p).opcode := A_MOV;
- taicpu(p).changeopsize(S_L);
- { do not use R_SUBWHOLE
- as movl %rdx,%eax
- is invalid in assembler PM }
- setsubreg(taicpu(p).oper[0]^.reg, R_SUBD);
- taicpu(hp1).loadConst(
- 0, taicpu(hp1).oper[0]^.val and $ff);
- end;
- end;
- S_WL:
- begin
- if (getsupreg(taicpu(p).oper[0]^.reg) =
- getsupreg(taicpu(p).oper[1]^.reg)) and not
- (cs_opt_size in current_settings.optimizerswitches) then
- { Change "movzwl %ax, %eax" to "andl $0x0ffffh, %eax" }
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var11')),p);
- taicpu(p).opcode := A_AND;
- taicpu(p).changeopsize(S_L);
- taicpu(p).loadConst(0, $ffff);
- end
- else if GetNextInstruction(p, hp1) and
- (tai(hp1).typ = ait_instruction) and
- (taicpu(hp1).opcode = A_AND) and
- (taicpu(hp1).oper[0]^.typ = top_const) and
- (taicpu(hp1).oper[1]^.typ = top_reg) and
- (taicpu(hp1).oper[1]^.reg =
- taicpu(p).oper[1]^.reg) then
- { Change "movzwl %reg1, %reg2; andl $const, %reg2"
- to "movl %reg1, reg2; andl $(const1 and $ffff), %reg2"}
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var12')),p);
- taicpu(p).opcode := A_MOV;
- taicpu(p).changeopsize(S_L);
- { do not use R_SUBWHOLE
- as movl %rdx,%eax
- is invalid in assembler PM }
- setsubreg(taicpu(p).oper[0]^.reg, R_SUBD);
- taicpu(hp1).loadConst(
- 0, taicpu(hp1).oper[0]^.val and $ffff);
- end;
- end;
- end
- else if (taicpu(p).oper[0]^.typ = top_ref) then
- begin
- if GetNextInstruction(p, hp1) and
- (tai(hp1).typ = ait_instruction) and
- (taicpu(hp1).opcode = A_AND) and
- MatchOpType(taicpu(hp1),top_const,top_reg) and
- (taicpu(hp1).oper[1]^.reg =
- taicpu(p).oper[1]^.reg) then
- begin
- taicpu(p).opcode := A_MOV;
- case taicpu(p).opsize of
- S_BL:
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var13')),p);
- taicpu(p).changeopsize(S_L);
- taicpu(hp1).loadConst(
- 0, taicpu(hp1).oper[0]^.val and $ff);
- end;
- S_WL:
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var14')),p);
- taicpu(p).changeopsize(S_L);
- taicpu(hp1).loadConst(
- 0, taicpu(hp1).oper[0]^.val and $ffff);
- end;
- S_BW:
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var15')),p);
- taicpu(p).changeopsize(S_W);
- taicpu(hp1).loadConst(
- 0, taicpu(hp1).oper[0]^.val and $ff);
- end;
- S_BQ:
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var16')),p);
- taicpu(p).changeopsize(S_Q);
- taicpu(hp1).loadConst(
- 0, taicpu(hp1).oper[0]^.val and $ff);
- end;
- S_WQ:
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var17')),p);
- taicpu(p).changeopsize(S_Q);
- taicpu(hp1).loadConst(
- 0, taicpu(hp1).oper[0]^.val and $ffff);
- end;
- S_LQ:
- begin
- if (cs_asm_source in current_settings.globalswitches) then
- asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,var18')),p);
- taicpu(p).changeopsize(S_Q);
- taicpu(hp1).loadConst(
- 0, taicpu(hp1).oper[0]^.val and $ffffffff);
- end;
- end;
- end;
- end;
- end;
- end;
- A_VMOVAPS,
- A_VMOVAPD:
- result:=OptPass1VMOVAP(p);
- A_VDIVSD,
- A_VDIVSS,
- A_VSUBSD,
- A_VSUBSS,
- A_VMULSD,
- A_VMULSS,
- A_VADDSD,
- A_VADDSS:
- begin
- if GetNextInstruction(p,hp1) and
- { we mix single and double opperations here because we assume that the compiler
- generates vmovapd only after double operations and vmovaps only after single operations }
- MatchInstruction(hp1,A_VMOVAPD,A_VMOVAPS,[S_NO]) and
- MatchOperand(taicpu(p).oper[2]^,taicpu(hp1).oper[0]^) and
- (taicpu(hp1).oper[1]^.typ=top_reg) then
- begin
- CopyUsedRegs(TmpUsedRegs);
- UpdateUsedRegs(TmpUsedRegs, tai(p.next));
- If not(RegUsedAfterInstruction(taicpu(hp1).oper[0]^.reg,hp1,TmpUsedRegs)) then
- begin
- taicpu(p).loadoper(2,taicpu(hp1).oper[1]^);
- asml.Remove(hp1);
- hp1.Free;
- end;
- end;
- end;
- end;
- end;
- end;
- end;
- function TCpuAsmOptimizer.PostPeepHoleOptsCpu(var p: tai): boolean;
- begin
- result := false;
- case p.typ of
- ait_instruction:
- begin
- case taicpu(p).opcode of
- A_MOV:
- PostPeepholeOptMov(p);
- end;
- end;
- end;
- end;
- begin
- casmoptimizer := TCpuAsmOptimizer;
- end.
|