123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383 |
- {
- Copyright (c) 1998-2004 by Jonas Maebe
- This unit calls the optimization procedures to optimize the assembler
- code for x86-64
- This program is free software; you can redistribute it and/or modify
- it under the terms of the GNU General Public License as published by
- the Free Software Foundation; either version 2 of the License, or
- (at your option) any later version.
- This program is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- GNU General Public License for more details.
- You should have received a copy of the GNU General Public License
- along with this program; if not, write to the Free Software
- Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
- ****************************************************************************
- }
- unit aoptcpu;
- {$i fpcdefs.inc}
- interface
- uses cgbase, cpubase, aasmtai, aopt, aoptx86, aoptcpub;
type
  { CPU-specific peephole optimizer built on top of the shared x86
    optimizer class. It overrides the three per-instruction hooks; each
    hook receives the current list entry in p and returns a boolean. }
  TCpuAsmOptimizer = class(TX86AsmOptimizer)
  public
    { first peephole pass }
    function PeepHoleOptPass1Cpu(var p: tai): boolean; override;
    { second peephole pass }
    function PeepHoleOptPass2Cpu(var p: tai): boolean; override;
    { post-peephole pass }
    function PostPeepHoleOptsCpu(var p: tai): boolean; override;
  end;
- implementation
- uses
- globtype, globals,
- cutils,
- verbose,
- cgutils,
- aoptobj,
- aasmbase, aasmdata, aasmcpu,
- itcpugas;
{ First peephole pass for a single list entry.

  p is the entry to inspect. Entries that are not instructions are ignored.
  Depending on the opcode the work is delegated to the inherited helpers
  OptPass1AND, OptPass1MOV, OptPass1VMOVAP and OptPass1VOP, or, for
  MOVSX/MOVZX, handled here.

  The result is whatever the delegated helper returned. The MOVSX/MOVZX
  handling leaves the result at False, even when it rewrites the code;
  when it folds three instructions into one, p is replaced by the
  surviving instruction. }
function TCpuAsmOptimizer.PeepHoleOptPass1Cpu(var p: tai): boolean;
  var
    hp1, hp2: tai;

  { Inserts the marker comment "PeepHole Optimization,<tag>" in front of p
    when cs_asm_source is set in the global switches. }
  procedure NoteOptimization(const tag: string);
    begin
      if cs_asm_source in current_settings.globalswitches then
        asml.insertbefore(tai_comment.create(strpnew('PeepHole Optimization,'+tag)),p);
    end;

  { True when the instruction following p is "and $const,reg" where reg is
    exactly the destination register of p. hp1 receives whatever
    GetNextInstruction produced. }
  function FollowedByAndConstOnDest: boolean;
    begin
      Result:=GetNextInstruction(p, hp1) and
        (tai(hp1).typ = ait_instruction) and
        (taicpu(hp1).opcode = A_AND) and
        (taicpu(hp1).oper[0]^.typ = top_const) and
        (taicpu(hp1).oper[1]^.typ = top_reg) and
        (taicpu(hp1).oper[1]^.reg = taicpu(p).oper[1]^.reg);
    end;

  { Removes and frees the AND in hp1 when its constant equals mask, i.e.
    when it only repeats the zero extension already done by p. }
  procedure RemoveAndIfMaskIs(mask: int64; const tag: string);
    begin
      if taicpu(hp1).oper[0]^.val = mask then
        begin
          NoteOptimization(tag);
          asml.remove(hp1);
          hp1.Free;
        end;
    end;

  { Register-to-register movzx.
    - Source and destination share a super register and we are not
      optimizing for size: turn p into "and $mask,reg" of size newsize.
    - Otherwise, if an "and $const,reg2" follows: turn p into a plain mov
      of size newsize (source register resized to srcsubreg) and fold the
      zero extension into the constant of the following AND. }
  procedure SimplifyRegToRegMovzx(mask: int64; newsize: topsize;
    srcsubreg: tsubregister; const selftag, andtag: string);
    begin
      if (getsupreg(taicpu(p).oper[0]^.reg) = getsupreg(taicpu(p).oper[1]^.reg)) and
         not (cs_opt_size in current_settings.optimizerswitches) then
        begin
          NoteOptimization(selftag);
          taicpu(p).opcode := A_AND;
          taicpu(p).changeopsize(newsize);
          taicpu(p).loadConst(0, mask);
        end
      else if FollowedByAndConstOnDest then
        begin
          NoteOptimization(andtag);
          taicpu(p).opcode := A_MOV;
          taicpu(p).changeopsize(newsize);
          setsubreg(taicpu(p).oper[0]^.reg, srcsubreg);
          taicpu(hp1).loadConst(0, taicpu(hp1).oper[0]^.val and mask);
        end;
    end;

  { Memory-source movzx followed by an AND in hp1: p has already been
    turned into a mov by the caller; give it the full destination size and
    fold the zero extension into the AND constant.
    NOTE(review): the resulting mov reads newsize bytes from the reference
    instead of the original narrower width - confirm this is acceptable. }
  procedure WidenLoadBeforeAnd(newsize: topsize; mask: int64; const tag: string);
    begin
      NoteOptimization(tag);
      taicpu(p).changeopsize(newsize);
      taicpu(hp1).loadConst(0, taicpu(hp1).oper[0]^.val and mask);
    end;

  begin
    Result := False;
    if p.typ <> ait_instruction then
      exit;
    case taicpu(p).opcode of
      A_AND:
        Result:=OptPass1AND(p);
      A_MOV:
        Result:=OptPass1MOV(p);
      A_MOVSX,
      A_MOVZX:
        begin
          { change  movsX/movzX  reg/ref, reg2
                    add/sub/or/... reg3/$const, reg2
                    mov     reg2, reg/ref
            to      add/sub/or/... reg3/$const, reg/ref

            The closing mov must really store reg2: without the super
            register comparison below, a mov from an unrelated register
            into reg/ref would be dropped and replaced by the arithmetic
            result.
            NOTE(review): whether reg2 is still read after the closing mov
            is not checked here - confirm against the callers/helpers. }
          if (taicpu(p).oper[1]^.typ = top_reg) and
             GetNextInstruction(p, hp1) and
             (hp1.typ = ait_instruction) and
             IsFoldableArithOp(taicpu(hp1), taicpu(p).oper[1]^.reg) and
             GetNextInstruction(hp1, hp2) and
             (hp2.typ = ait_instruction) and
             (taicpu(hp2).opcode = A_MOV) and
             (taicpu(hp2).oper[0]^.typ = top_reg) and
             (getsupreg(taicpu(hp2).oper[0]^.reg) = getsupreg(taicpu(p).oper[1]^.reg)) and
             OpsEqual(taicpu(hp2).oper[1]^, taicpu(p).oper[0]^) then
            begin
              { by example (unary / binary form):
                  movswl  %si,%eax        movswl  %si,%eax      p
                  decl    %eax            addl    %edx,%eax     hp1
                  movw    %ax,%si         movw    %ax,%si       hp2
                step 1, the arithmetic takes the size of the closing mov:
                  decw    %eax            addw    %edx,%eax     hp1 }
              taicpu(hp1).changeopsize(taicpu(hp2).opsize);
              { step 2, it operates directly on the final destination
                (and a register source is resized to match):
                  decw    %si             addw    %dx,%si       hp1 }
              case taicpu(hp1).ops of
                1:
                  taicpu(hp1).loadoper(0, taicpu(hp2).oper[1]^);
                2:
                  begin
                    taicpu(hp1).loadoper(1, taicpu(hp2).oper[1]^);
                    if (taicpu(hp1).oper[0]^.typ = top_reg) then
                      setsubreg(taicpu(hp1).oper[0]^.reg,
                        getsubreg(taicpu(hp2).oper[0]^.reg));
                  end;
                else
                  internalerror(2008042701);
              end;
              { step 3, the extension and the closing mov disappear and the
                arithmetic instruction becomes the current instruction }
              NoteOptimization('var3');
              asml.remove(p);
              asml.remove(hp2);
              p.Free;
              hp2.Free;
              p := hp1;
            end
          else if taicpu(p).opcode = A_MOVZX then
            begin
              { remove a superfluous AND after the movzx: the mask equals
                the bits the zero extension already guarantees }
              if (taicpu(p).oper[1]^.typ = top_reg) and
                 FollowedByAndConstOnDest then
                case taicpu(p).opsize of
                  S_BL, S_BW, S_BQ:
                    RemoveAndIfMaskIs($ff, 'var4');
                  S_WL, S_WQ:
                    RemoveAndIfMaskIs($ffff, 'var5');
                  S_LQ:
                    RemoveAndIfMaskIs($ffffffff, 'var6');
                end;
              { change some movzx constructs to faster synonyms (all
                examples are given with eax/ax, but are also valid for
                other registers) }
              if (taicpu(p).oper[1]^.typ = top_reg) then
                begin
                  if (taicpu(p).oper[0]^.typ = top_reg) then
                    case taicpu(p).opsize of
                      { "movzbw %al,%ax" -> "andw $0xff,%ax", or
                        "movzbw %reg1,%reg2; andw $const,%reg2" ->
                        "movw %reg1,%reg2; andw $(const and $ff),%reg2" }
                      S_BW:
                        SimplifyRegToRegMovzx($ff, S_W, R_SUBW, 'var7', 'var8');
                      { "movzbl %al,%eax" -> "andl $0xff,%eax", or
                        "movzbl %reg1,%reg2; andl $const,%reg2" ->
                        "movl %reg1,%reg2; andl $(const and $ff),%reg2".
                        R_SUBD and not R_SUBWHOLE is used for the source,
                        as "movl %rdx,%eax" is invalid in assembler }
                      S_BL:
                        SimplifyRegToRegMovzx($ff, S_L, R_SUBD, 'var9', 'var10');
                      { "movzwl %ax,%eax" -> "andl $0xffff,%eax", or
                        "movzwl %reg1,%reg2; andl $const,%reg2" ->
                        "movl %reg1,%reg2; andl $(const and $ffff),%reg2".
                        Same R_SUBD remark as above }
                      S_WL:
                        SimplifyRegToRegMovzx($ffff, S_L, R_SUBD, 'var11', 'var12');
                    end
                  else if (taicpu(p).oper[0]^.typ = top_ref) then
                    begin
                      { "movzXY ref,%reg; and $const,%reg" ->
                        "mov ref,%reg; and $(const and mask),%reg" }
                      if GetNextInstruction(p, hp1) and
                         (tai(hp1).typ = ait_instruction) and
                         (taicpu(hp1).opcode = A_AND) and
                         MatchOpType(taicpu(hp1),top_const,top_reg) and
                         (taicpu(hp1).oper[1]^.reg = taicpu(p).oper[1]^.reg) then
                        begin
                          taicpu(p).opcode := A_MOV;
                          case taicpu(p).opsize of
                            S_BL:
                              WidenLoadBeforeAnd(S_L, $ff, 'var13');
                            S_WL:
                              WidenLoadBeforeAnd(S_L, $ffff, 'var14');
                            S_BW:
                              WidenLoadBeforeAnd(S_W, $ff, 'var15');
                            S_BQ:
                              WidenLoadBeforeAnd(S_Q, $ff, 'var16');
                            S_WQ:
                              WidenLoadBeforeAnd(S_Q, $ffff, 'var17');
                            S_LQ:
                              WidenLoadBeforeAnd(S_Q, $ffffffff, 'var18');
                          end;
                        end;
                    end;
                end;
            end;
        end;
      A_VMOVAPS,
      A_VMOVAPD:
        Result:=OptPass1VMOVAP(p);
      A_VDIVSD,
      A_VDIVSS,
      A_VSUBSD,
      A_VSUBSS,
      A_VMULSD,
      A_VMULSS,
      A_VADDSD,
      A_VADDSS:
        Result:=OptPass1VOP(p);
    end;
  end;
{ Second peephole pass for a single list entry.

  Only instructions are looked at: MOV is handed to OptPass2MOV and IMUL
  to OptPass2Imul, and the helper's result is returned. Every other entry
  yields False. }
function TCpuAsmOptimizer.PeepHoleOptPass2Cpu(var p : tai) : boolean;
  begin
    Result:=False;
    { nothing to do for labels, comments, data, ... }
    if p.typ<>ait_instruction then
      exit;
    case taicpu(p).opcode of
      A_MOV:
        Result:=OptPass2MOV(p);
      A_IMUL:
        Result:=OptPass2Imul(p);
    end;
  end;
{ Post-peephole pass for a single list entry.

  For a MOV instruction PostPeepholeOptMov is invoked on p; all other
  entries are left alone. The function result is always false. }
function TCpuAsmOptimizer.PostPeepHoleOptsCpu(var p: tai): boolean;
  begin
    result:=false;
    { only instructions carry an opcode }
    if p.typ<>ait_instruction then
      exit;
    if taicpu(p).opcode=A_MOV then
      PostPeepholeOptMov(p);
  end;
initialization
  { Publish this optimizer class through casmoptimizer when the unit is
    initialized (presumably the class reference the generic optimizer
    driver instantiates - confirm in the unit that declares it). }
  casmoptimizer:=TCpuAsmOptimizer;
end.
|