123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457 |
- {
- $Id$
- Copyright (c) 1998-2002 by Jonas Maebe, member of the Free Pascal
- development team
- This unit contains register renaming functionality
- This program is free software; you can redistribute it and/or modify
- it under the terms of the GNU General Public License as published by
- the Free Software Foundation; either version 2 of the License, or
- (at your option) any later version.
- This program is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- GNU General Public License for more details.
- You should have received a copy of the GNU General Public License
- along with this program; if not, write to the Free Software
- Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
- ****************************************************************************
- }
- Unit rrOpt386;
- {$i fpcdefs.inc}
- Interface
- Uses aasmbase,aasmtai,aasmcpu;
- procedure doRenaming(asml: TAAsmoutput; first, last: Tai);
- Implementation
- Uses
- {$ifdef replaceregdebug}cutils,{$endif}
- verbose,globals,cpubase,daopt386,csopt386,cginfo,rgobj;
- function canBeFirstSwitch(p: Taicpu; reg: tregister): boolean;
- { Checks whether the operation p performs on reg can be switched to another  }
- { register without an additional mov, e.g. "addl $4,%reg1" can be changed to }
- { "leal 4(%reg1),%reg2".                                                     }
- {   p   : the instruction that modifies reg                                  }
- {   reg : the register whose new value should end up in another register     }
- { Returns true only for the opcode/operand combinations listed below; every  }
- { other instruction yields false.                                            }
- begin
-   canBeFirstSwitch := false;
-   case p.opcode of
-     A_MOV,A_MOVZX,A_MOVSX,A_LEA:
-       canBeFirstSwitch :=
-         (p.oper[1].typ = top_reg) and
-         (reg32(p.oper[1].reg).enum = reg.enum);
-     A_IMUL:
-       { the instruction gets rewritten into the three operand form of imul, }
-       { which only exists with an immediate as first operand. The rewrite   }
-       { also derives the new destination from oper[1], so oper[1] has to be }
-       { reg itself, both in the two and in the three operand form           }
-       canBeFirstSwitch :=
-         (p.ops >= 2) and
-         (p.oper[0].typ = top_const) and
-         (p.oper[1].typ = top_reg) and
-         (reg32(p.oper[1].reg).enum = reg.enum) and
-         (p.oper[p.ops-1].typ = top_reg) and
-         (reg32(p.oper[p.ops-1].reg).enum = reg.enum) and
-         (not pTaiprop(p.optinfo)^.FlagsUsed);
-     A_INC,A_DEC:
-       { inc/dec have only one operand, so the register is in oper[0] and }
-       { not in oper[1] like for add/sub                                  }
-       canBeFirstSwitch :=
-         (p.ops = 1) and
-         (p.oper[0].typ = top_reg) and
-         (p.opsize = S_L) and
-         (reg32(p.oper[0].reg).enum = reg.enum) and
-         (not pTaiprop(p.optinfo)^.FlagsUsed);
-     A_SUB,A_ADD:
-       { a sub can only be expressed as lea if the subtracted value is a }
-       { constant (its negation becomes the offset)                      }
-       canBeFirstSwitch :=
-         (p.oper[1].typ = top_reg) and
-         (p.opsize = S_L) and
-         (reg32(p.oper[1].reg).enum = reg.enum) and
-         (p.oper[0].typ <> top_ref) and
-         ((p.opcode <> A_SUB) or
-          (p.oper[0].typ = top_const)) and
-         (not pTaiprop(p.optinfo)^.FlagsUsed);
-     A_SHL:
-       { shifts by 1, 2 or 3 correspond to the lea scale factors 2, 4 and 8 }
-       canBeFirstSwitch :=
-         (p.opsize = S_L) and
-         (p.oper[1].typ = top_reg) and
-         (p.oper[1].reg.enum = reg.enum) and
-         (p.oper[0].typ = top_const) and
-         (p.oper[0].val in [1,2,3]) and
-         (not pTaiprop(p.optinfo)^.FlagsUsed);
-   end;
- end;
- procedure switchReg(var reg: tregister; reg1, reg2: tregister);
- { Exchanges the roles of reg1 and reg2 in reg: when reg is one of the two    }
- { registers it becomes the other one. When reg is an 8 or 16 bit register    }
- { equal to what changeregsize returns for reg1 or reg2 at that size, it      }
- { becomes the equally sized register of the other one. Any other register is }
- { left untouched. None of the three registers may lie beyond lastreg,        }
- { otherwise internalerror 2003010801 is raised.                              }
- begin
-   if (reg1.enum>lastreg) or
-      (reg2.enum>lastreg) or
-      (reg.enum>lastreg) then
-     internalerror(2003010801);
-   { direct hit on one of the two registers }
-   if reg.enum = reg1.enum then
-     begin
-       reg := reg2;
-       exit;
-     end;
-   if reg.enum = reg2.enum then
-     begin
-       reg := reg1;
-       exit;
-     end;
-   { 8 bit subregister }
-   if (reg.enum in regset8bit) then
-     begin
-       if (reg.enum = changeregsize(reg1,S_B).enum) then
-         reg := changeregsize(reg2,S_B)
-       else if reg.enum = changeregsize(reg2,S_B).enum then
-         reg := changeregsize(reg1,S_B);
-       exit;
-     end;
-   { 16 bit subregister }
-   if (reg.enum in regset16bit) then
-     begin
-       if reg.enum = changeregsize(reg1,S_W).enum then
-         reg := changeregsize(reg2,S_W)
-       else if reg.enum = changeregsize(reg2,S_W).enum then
-         reg := changeregsize(reg1,S_W);
-     end;
- end;
- procedure switchOp(var op: toper; reg1, reg2: tregister);
- { Runs switchReg on every register stored in op: the register itself for a }
- { register operand, base and index for a reference operand. Operands of    }
- { any other type are not touched.                                          }
- begin
-   if op.typ = top_reg then
-     switchReg(op.reg,reg1,reg2)
-   else if op.typ = top_ref then
-     begin
-       switchReg(op.ref^.base,reg1,reg2);
-       switchReg(op.ref^.index,reg1,reg2);
-     end;
- end;
- procedure doSwitchReg(hp: Taicpu; reg1,reg2: tregister);
- { Applies switchOp with reg1 and reg2 to each of the hp.ops operands of hp, }
- { starting at operand 0.                                                    }
- var
-   idx: longint;
- begin
-   idx := 0;
-   while idx < hp.ops do
-     begin
-       switchOp(hp.oper[idx],reg1,reg2);
-       inc(idx);
-     end;
- end;
- procedure doFirstSwitch(p: Taicpu; reg1, reg2: tregister);
- { Rewrites p, the first instruction that modifies reg1, so that its result   }
- { is written to reg2 instead, while the old value is still read from reg1.   }
- { mov/movzx/movsx/lea only get their operands changed, imul is turned into   }
- { its three operand form and inc/dec/add/sub/shl are turned into a lea.      }
- {   p    : instruction to rewrite (expected to have passed canBeFirstSwitch) }
- {   reg1 : register p originally modifies                                    }
- {   reg2 : register that receives the result after the rewrite               }
- { Raises internalerror 200010031 for an add/sub whose first operand is not   }
- { a constant, symbol or register and 200010032 for an unsupported opcode.    }
- var
-   tmpRef: treference;
- begin
-   case p.opcode of
-     A_MOV,A_MOVZX,A_MOVSX,A_LEA:
-       begin
-         { destination: reg1 -> reg2, source: reg2 -> reg1 }
-         changeOp(p.oper[1],reg1,reg2);
-         changeOp(p.oper[0],reg2,reg1);
-       end;
-     A_IMUL:
-       begin
-         if p.ops < 3 then
-           begin
-             { two operand form: oper[1] is source and destination at the }
-             { same time, so duplicate it into the new third operand      }
-             p.ops := 3;
-             p.loadreg(2,p.oper[1].reg);
-           end
-         else
-           { already three operands: keep the existing destination operand  }
-           { (it must not be overwritten with the source) and treat the     }
-           { source the same way as the source of a mov                     }
-           changeOp(p.oper[1],reg2,reg1);
-         changeOp(p.oper[2],reg1,reg2);
-       end;
-     A_INC,A_DEC:
-       begin
-         { "incl %reg1" -> "leal 1(%reg1),%reg2", decl analogously with -1 }
-         reference_reset(tmpref);
-         tmpref.base := reg1;
-         case p.opcode of
-           A_INC:
-             tmpref.offset := 1;
-           A_DEC:
-             tmpref.offset := -1;
-         end;
-         p.ops := 2;
-         p.opcode := A_LEA;
-         p.loadreg(1,reg2);
-         p.loadref(0,tmpref);
-       end;
-     A_SUB,A_ADD:
-       begin
-         reference_reset(tmpref);
-         tmpref.base := reg1;
-         case p.oper[0].typ of
-           top_const:
-             begin
-               tmpref.offset := p.oper[0].val;
-               if p.opcode = A_SUB then
-                 tmpref.offset := - tmpRef.offset;
-             end;
-           top_symbol:
-             tmpref.symbol := p.oper[0].sym;
-           top_reg:
-             begin
-               { "addl %reg2,%reg1" has to become "leal (%reg1,%reg1),%reg2": }
-               { the mov that loaded reg2 is being removed, so the value reg2 }
-               { would have contained is only available in reg1               }
-               if p.oper[0].reg.enum = reg2.enum then
-                 tmpref.index := reg1
-               else
-                 tmpref.index := p.oper[0].reg;
-               tmpref.scalefactor := 1;
-             end;
-           else internalerror(200010031);
-         end;
-         p.opcode := A_LEA;
-         p.loadref(0,tmpref);
-         p.loadreg(1,reg2);
-       end;
-     A_SHL:
-       begin
-         { "shll $n,%reg1" -> "leal (,%reg1,2^n),%reg2" }
-         reference_reset(tmpref);
-         tmpref.index := reg1;
-         tmpref.scalefactor := 1 shl p.oper[0].val;
-         p.opcode := A_LEA;
-         p.loadref(0,tmpref);
-         p.loadreg(1,reg2);
-       end;
-     else internalerror(200010032);
-   end;
- end;
- function switchRegs(asml: TAAsmoutput; reg1, reg2: tregister; start: Tai): Boolean;
- { change movl %reg1,%reg2 ... bla ... to ... bla with reg1 and reg2 switched.
-   start is that mov instruction. The first loop only scans forward from
-   start, without changing anything, until it either reaches an instruction
-   at which the renamed sequence can end (sequenceEnd) or one that forbids
-   the renaming (tmpResult becomes false). Only if an end was found, the
-   second loop rewrites the instructions between start and that end, and
-   allocRegBetween is called for both registers from start up to the last
-   instruction found to contain them.
-   Returns true if the registers were switched. start itself is neither
-   changed nor removed by this routine. }
- var
- endP, hp, lastreg1,lastreg2: Tai;
- switchDone, switchLast, tmpResult, sequenceEnd, reg1Modified, reg2Modified: boolean;
- reg1StillUsed, reg2StillUsed, isInstruction: boolean;
- begin
- switchRegs := false;
- tmpResult := true; { stays true as long as nothing forbids the renaming }
- sequenceEnd := false;
- reg1Modified := false;
- reg2Modified := false;
- endP := start;
- while tmpResult and not sequenceEnd do
- begin
- tmpResult :=
- getNextInstruction(endP,endP);
- If tmpResult and
- not pTaiprop(endp.optinfo)^.canBeRemoved then
- begin
- { if the newReg gets stored back to the oldReg, we can change }
- { "mov %oldReg,%newReg; <operations on %newReg>; mov %newReg, }
- { %oldReg" to "<operations on %oldReg>" }
- switchLast := storeBack(endP,reg1,reg2);
- reg1StillUsed := reg1.enum in pTaiprop(endp.optinfo)^.usedregs;
- reg2StillUsed := reg2.enum in pTaiprop(endp.optinfo)^.usedregs;
- isInstruction := endp.typ = ait_instruction;
- sequenceEnd :=
- switchLast or
- { if both registers are released right before an instruction }
- { that contains hardcoded regs, it's ok too }
- (not reg1StillUsed and not reg2StillUsed) or
- { no support for (i)div, mul and imul with hardcoded operands }
- (((not isInstruction) or
- noHardCodedRegs(Taicpu(endP),reg1,reg2)) and
- (not reg1StillUsed or
- (isInstruction and findRegDealloc(reg1,endP) and
- regLoadedWithNewValue(reg1,false,Taicpu(endP)))) and
- (not reg2StillUsed or
- (isInstruction and findRegDealloc(reg2,endP) and
- regLoadedWithNewValue(reg2,false,Taicpu(endP)))));
- { we can't switch reg1 and reg2 in something like }
- { movl %reg1,%reg2 }
- { movl (%reg2),%reg2 }
- { movl 4(%reg1),%reg1 }
- if reg2Modified and not(reg1Modified) and
- regReadByInstruction(reg1,endP) then
- begin
- tmpResult := false;
- break
- end;
- if not reg1Modified then
- begin
- reg1Modified := regModifiedByInstruction(reg1,endP);
- if reg1Modified and not canBeFirstSwitch(Taicpu(endP),reg1) then { the first write to reg1 must be convertible by doFirstSwitch }
- begin
- tmpResult := false;
- break;
- end;
- end;
- if not reg2Modified then
- reg2Modified := regModifiedByInstruction(reg2,endP);
- if sequenceEnd then { end found: leave before the veto below can reset tmpResult }
- break;
- tmpResult := { give up on a label, on a jmp, or when NoHardCodedRegs or RegSizesOk reject the instruction }
- (endp.typ <> ait_label) and
- ((not isInstruction) or
- (NoHardCodedRegs(Taicpu(endP),reg1,reg2) and
- RegSizesOk(reg1,reg2,Taicpu(endP)) and
- (Taicpu(endp).opcode <> A_JMP)));
- end;
- end;
- if tmpResult and sequenceEnd then
- begin
- switchRegs := true;
- reg1Modified := false; { the modification tracking starts over for the rewrite pass }
- reg2Modified := false;
- lastreg1 := start;
- lastreg2 := start;
- getNextInstruction(start,hp);
- while hp <> endP do
- begin
- if (not pTaiprop(hp.optinfo)^.canberemoved) and
- (hp.typ = ait_instruction) then
- begin
- switchDone := false;
- if not reg1Modified then
- begin
- reg1Modified := regModifiedByInstruction(reg1,hp);
- if reg1Modified then
- begin
- doFirstSwitch(Taicpu(hp),reg1,reg2); { first write to reg1: redirect its result to reg2 }
- switchDone := true;
- end;
- end;
- if not switchDone then
- if reg1Modified then
- doSwitchReg(Taicpu(hp),reg1,reg2) { after the first write to reg1: exchange both registers }
- else
- doReplaceReg(Taicpu(hp),reg2,reg1); { reg1 not written yet; presumably substitutes reg1 for reg2 - doReplaceReg is defined elsewhere }
- end;
- if regininstruction(reg1.enum,hp) then
- lastreg1 := hp;
- if regininstruction(reg2.enum,hp) then
- lastreg2 := hp;
- getNextInstruction(hp,hp);
- end;
- if switchLast then
- doSwitchReg(Taicpu(hp),reg1,reg2) { hp = endP here, the instruction for which storeBack returned true }
- else getLastInstruction(hp,hp); { NOTE(review): hp is not read again below }
- allocRegBetween(asmL,reg1,start,lastreg1);
- allocRegBetween(asmL,reg2,start,lastreg2);
- end;
- end;
- procedure doRenaming(asml: TAAsmoutput; first, last: Tai);
- { Walks the list from first (after SkipHead) until last is reached and tries }
- { switchRegs on every 32 bit register to register mov that is not already   }
- { marked as removable. If switchRegs succeeds, the mov is flagged with       }
- { canBeRemoved; it is not unlinked from asml here.                           }
- var
-   cur: Tai;
-   movInstr: Taicpu;
- begin
-   cur := First;
-   SkipHead(cur);
-   while cur <> last do
-     begin
-       if cur.typ = ait_instruction then
-         if Taicpu(cur).opcode = A_MOV then
-           begin
-             movInstr := Taicpu(cur);
-             { both registers currently have to be R_EDI; the wider test }
-             { against rg.usableregsint+[R_EDI] is disabled             }
-             if not(pTaiprop(cur.optinfo)^.canBeRemoved) and
-                (movInstr.oper[0].typ = top_reg) and
-                (movInstr.oper[1].typ = top_reg) and
-                (movInstr.opsize = S_L) and
-                (movInstr.oper[0].reg.enum in ([R_EDI])) and
-                (movInstr.oper[1].reg.enum in ([R_EDI])) then
-               if switchRegs(asml,movInstr.oper[0].reg,
-                             movInstr.oper[1].reg,cur) then
-                 pTaiprop(cur.optinfo)^.canBeRemoved := true;
-           end;
-       getNextInstruction(cur,cur);
-     end;
- end;
- End.
- {
- $Log$
- Revision 1.22 2003-06-03 21:09:05 peter
- * internal changeregsize for optimizer
- * fix with a hack to not remove the first instruction of a block
- which will leave blockstart pointing to invalid memory
- Revision 1.21 2003/03/28 19:16:57 peter
- * generic constructor working for i386
- * remove fixed self register
- * esi added as address register for i386
- Revision 1.20 2003/02/19 22:00:16 daniel
- * Code generator converted to new register notation
- - Horribly outdated todo.txt removed
- Revision 1.19 2003/01/08 18:43:57 daniel
- * Tregister changed into a record
- Revision 1.18 2002/07/01 18:46:34 peter
- * internal linker
- * reorganized aasm layer
- Revision 1.17 2002/05/18 13:34:26 peter
- * readded missing revisions
- Revision 1.16 2002/05/16 19:46:52 carl
- + defines.inc -> fpcdefs.inc to avoid conflicts if compiling by hand
- + try to fix temp allocation (still in ifdef)
- + generic constructor calls
- + start of tassembler / tmodulebase class cleanup
- Revision 1.14 2002/05/12 16:53:18 peter
- * moved entry and exitcode to ncgutil and cgobj
- * foreach gets extra argument for passing local data to the
- iterator function
- * -CR checks also class typecasts at runtime by changing them
- into as
- * fixed compiler to cycle with the -CR option
- * fixed stabs with elf writer, finally the global variables can
- be watched
- * removed a lot of routines from cga unit and replaced them by
- calls to cgobj
- * u32bit-s32bit updates for and,or,xor nodes. When one element is
- u32bit then the other is typecasted also to u32bit without giving
- a rangecheck warning/error.
- * fixed pascal calling method with reversing also the high tree in
- the parast, detected by tcalcst3 test
- Revision 1.13 2002/04/21 15:42:17 carl
- * changeregsize -> changeregsize
- Revision 1.12 2002/04/20 21:37:08 carl
- + generic FPC_CHECKPOINTER
- + first parameter offset in stack now portable
- * rename some constants
- + move some cpu stuff to other units
- - remove unused constants
- * fix stacksize for some targets
- * fix generic size problems which depend now on EXTEND_SIZE constant
- * removing frame pointer in routines is only available for : i386,m68k and vis targets
- Revision 1.11 2002/04/15 19:44:22 peter
- * fixed stackcheck that would be called recursively when a stack
- error was found
- * generic changeregsize(reg,size) for i386 register resizing
- * removed some more routines from cga unit
- * fixed returnvalue handling
- * fixed default stacksize of linux and go32v2, 8kb was a bit small :-)
- Revision 1.10 2002/04/02 17:11:39 peter
- * tlocation,treference update
- * LOC_CONSTANT added for better constant handling
- * secondadd splitted in multiple routines
- * location_force_reg added for loading a location to a register
- of a specified size
- * secondassignment parses now first the right and then the left node
- (this is compatible with Kylix). This saves a lot of push/pop especially
- with string operations
- * adapted some routines to use the new cg methods
- Revision 1.9 2002/03/31 20:26:41 jonas
- + a_loadfpu_* and a_loadmm_* methods in tcg
- * register allocation is now handled by a class and is mostly processor
- independent (+rgobj.pas and i386/rgcpu.pas)
- * temp allocation is now handled by a class (+tgobj.pas, -i386\tgcpu.pas)
- * some small improvements and fixes to the optimizer
- * some register allocation fixes
- * some fpuvaroffset fixes in the unary minus node
- * push/popusedregisters is now called rg.save/restoreusedregisters and
- (for i386) uses temps instead of push/pop's when using -Op3 (that code is
- also better optimizable)
- * fixed and optimized register saving/restoring for new/dispose nodes
- * LOC_FPU locations now also require their "register" field to be set to
- R_ST, not R_ST0 (the latter is used for LOC_CFPUREGISTER locations only)
- - list field removed of the tnode class because it's not used currently
- and can cause hard-to-find bugs
- }
|