{
    Copyright (c) 1998-2002 by Florian Klaempfl

    This unit implements the x86 specific class for the register
    allocator

    This program is free software; you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation; either version 2 of the License, or
    (at your option) any later version.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with this program; if not, write to the Free Software
    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.

****************************************************************************
}
unit rgx86;

{$i fpcdefs.inc}

  interface

    uses
      cclasses,globtype,
      cpubase,cpuinfo,cgbase,cgutils,
      aasmbase,aasmtai,aasmdata,aasmcpu,
      rgobj;

    type
       { x86 flavour of the generic register allocator class trgobj.
         It overrides the two spilling hooks declared below. }
       trgx86 = class(trgobj)
         { Returns the subregister to use when spilling r. }
         function  get_spill_subreg(r : tregister) : tsubregister;override;
         { Tries to rewrite instr so that the operand holding orgreg becomes
           a memory reference to spilltemp. Returns true if instr was
           rewritten, false if it was left untouched. }
         function  do_spill_replace(list:TAsmList;instr:taicpu;orgreg:tsuperregister;const spilltemp:treference):boolean;override;
       end;

       { Variant record: "pushed" and "ofs" share the same storage.
         Within this unit only "ofs" is referenced, and only from the
         disabled save/restore code further down. }
       tpushedsavedloc = record
         case byte of
           0: (pushed: boolean);
           1: (ofs: longint);
       end;

       { One save slot per super register. }
       tpushedsavedfpu = array[tsuperregister] of tpushedsavedloc;

       { Bookkeeping for the x87 fpu register stack. Note that this class
         does not descend from trgobj. }
       trgx86fpu = class
          { The "usableregsxxx" contain all registers of type "xxx" that }
          { aren't currently allocated to a regvar. The "unusedregsxxx"  }
          { contain all registers of type "xxx" that aren't currently    }
          { allocated                                                    }
          unusedregsfpu,usableregsfpu : Tsuperregisterset;
          { these counters contain the number of elements in the }
          { unusedregsxxx/usableregsxxx sets                     }
          countunusedregsfpu : byte;

          { Contains the registers which are really used by the proc itself.
            It doesn't take care of registers used by called procedures
          }
          used_in_proc : tcpuregisterset;

          {reg_pushes_other : regvarother_longintarray;
          is_reg_var_other : regvarother_booleanarray;
          regvar_loaded_other : regvarother_booleanarray;}

          { Not read or written anywhere in this unit.
            NOTE(review): presumably the current depth of the fpu stack,
            maintained by the code generator - confirm against callers. }
          fpuvaroffset : byte;

          { Clears used_in_proc and copies usableregsfpu to unusedregsfpu. }
          constructor create;

          { Always returns NR_ST; list is not used. }
          function getregisterfpu(list: TAsmList) : tregister;
          { Currently a no-op; neither parameter is used. }
          procedure ungetregisterfpu(list: TAsmList; r : tregister);

          { pushes and restores registers }
          { In the current implementation saveusedfpuregisters only adds s
            to used_in_proc and leaves "saved" unmodified, and
            restoreusedfpuregisters does nothing; the real save/restore
            code is commented out in the implementation section. }
          procedure saveusedfpuregisters(list:TAsmList;
                                         var saved:Tpushedsavedfpu;
                                         const s:Tcpuregisterset);
          procedure restoreusedfpuregisters(list:TAsmList;
                                            const saved:Tpushedsavedfpu);

          { corrects the fpu stack register by ofs }
          function correct_fpuregister(r : tregister;ofs : byte) : tregister;
       end;


implementation

    uses
       systems,
       verbose;

    const
       { This value is used in tsaved. If the array value is equal
         to this, then this means that this register is not used.}
       { Only referenced from the commented-out save/restore code below. }
       reg_not_saved = $7fffffff;


{******************************************************************************
                                    Trgcpu
******************************************************************************}

    { Returns the subregister part of r as reported by getsubreg. }
    function trgx86.get_spill_subreg(r : tregister) : tsubregister;
      begin
        result:=getsubreg(r);
      end;


    function trgx86.do_spill_replace(list:TAsmList;instr:taicpu;orgreg:tsuperregister;const spilltemp:treference):boolean;

    {Decide whether a "replace" spill is possible, i.e. whether we can replace a register
     in an instruction by a memory reference. For example, in "mov ireg26d,0", the imaginary
     register ireg26d can be replaced by a memory reference.}

    { Parameters:
        list      - not used by this implementation
        instr     - instruction to inspect; modified in place on success
        orgreg    - super register that is being spilled
        spilltemp - memory location that takes the place of the register
      Result:
        true if one operand of instr was changed into a reference holding
        a copy of spilltemp, false if instr was left as it was.
      Several inconsistent operand combinations end in a call to
      internalerror instead of returning false.
      regtype and get_alias are not declared in this unit; presumably both
      are inherited from trgobj - confirm there. }

      var
        { n: index shift applied for 3-operand instructions (0 or 1).
          replaceoper: index of the operand to replace, -1 means "none". }
        n,replaceoper : longint;
      begin
        result:=false;
        with instr do
          begin
            replaceoper:=-1;
            case ops of
              1 :
                begin
                  { A single register operand of our register type is a
                    candidate; it is expected to alias orgreg. }
                  if (oper[0]^.typ=top_reg) and
                     (getregtype(oper[0]^.reg)=regtype) then
                    begin
                      if get_alias(getsupreg(oper[0]^.reg))<>orgreg then
                        internalerror(200410101);
                      replaceoper:=0;
                    end;
                end;
              2,3 :
                begin
                  { We can handle opcodes with 2 and 3 operands the same way. The opcodes
                    with 3 registers are shrd/shld, where the 3rd operand is const or CL,
                    that doesn't need spilling.
                    However, due to AT&T order inside the compiler, the 3rd operand is
                    numbered 0, so look at operand no. 1 and 2 if we have 3 operands by
                    adding a "n". }
                  n:=0;
                  if ops=3 then
                    n:=1;
                  { reg,reg: only considered when the two operands are not
                    both the same register of our type (replacing one of
                    them would leave the other one behind). The first
                    operand is preferred over the second. }
                  if (oper[n+0]^.typ=top_reg) and
                     (oper[n+1]^.typ=top_reg) and
                     ((getregtype(oper[n+0]^.reg)<>regtype) or
                      (getregtype(oper[n+1]^.reg)<>regtype) or
                      (get_alias(getsupreg(oper[n+0]^.reg))<>get_alias(getsupreg(oper[n+1]^.reg)))) then
                    begin
                      if (getregtype(oper[n+0]^.reg)=regtype) and
                         (get_alias(getsupreg(oper[n+0]^.reg))=orgreg) then
                        replaceoper:=0+n
                      else if (getregtype(oper[n+1]^.reg)=regtype) and
                         (get_alias(getsupreg(oper[n+1]^.reg))=orgreg) then
                        replaceoper:=1+n;
                    end
                  { reg,const: the register has to be orgreg. }
                  else if (oper[n+0]^.typ=top_reg) and
                     (oper[n+1]^.typ=top_const) then
                    begin
                      if (getregtype(oper[0+n]^.reg)=regtype) and
                         (get_alias(getsupreg(oper[0+n]^.reg))=orgreg) then
                        replaceoper:=0+n
                      else
                        internalerror(200704282);
                    end
                  { const,reg: the register has to be orgreg. }
                  else if (oper[n+0]^.typ=top_const) and
                     (oper[n+1]^.typ=top_reg) then
                    begin
                      if (getregtype(oper[1+n]^.reg)=regtype) and
                         (get_alias(getsupreg(oper[1+n]^.reg))=orgreg) then
                        replaceoper:=1+n
                      else
                        internalerror(200704283);
                    end;
                  { Veto the candidate for opcodes that cannot take a memory
                    operand at that position. Only the index values 0 and 1
                    are filtered here; an index of 2 (possible when ops=3)
                    passes through unchanged. }
                  case replaceoper of
                    0 :
                      begin
                        { Some instructions don't allow memory references
                          for source }
                        case instr.opcode of
                          A_BT,
                          A_BTS,
                          A_BTC,
                          A_BTR :
                            replaceoper:=-1;
                        end;
                      end;
                    1 :
                      begin
                        { Some instructions don't allow memory references
                          for destination }
                        case instr.opcode of
                          A_MOVZX,
                          A_MOVSX,
                          A_MULSS,
                          A_MULSD,
                          A_SUBSS,
                          A_SUBSD,
                          A_ADDSD,
                          A_ADDSS,
                          A_DIVSD,
                          A_DIVSS,
                          A_SHLD,
                          A_SHRD,
                          A_CVTDQ2PD,
                          A_CVTDQ2PS,
                          A_CVTPD2DQ,
                          A_CVTPD2PI,
                          A_CVTPD2PS,
                          A_CVTPI2PD,
                          A_CVTPS2DQ,
                          A_CVTPS2PD,
                          A_CVTSD2SI,
                          A_CVTSD2SS,
                          A_CVTSI2SD,
                          A_CVTSS2SD,
                          A_CVTTPD2PI,
                          A_CVTTPD2DQ,
                          A_CVTTPS2DQ,
                          A_CVTTSD2SI,
                          A_CVTPI2PS,
                          A_CVTPS2PI,
                          A_CVTSI2SS,
                          A_CVTSS2SI,
                          A_CVTTPS2PI,
                          A_CVTTSS2SI,
                          A_IMUL,
                          A_XORPD,
                          A_XORPS,
                          A_ORPD,
                          A_ORPS,
                          A_ANDPD,
                          A_ANDPS:
                            replaceoper:=-1;
{$ifdef x86_64}
                          A_MOV:
                             { 64 bit constants can only be moved into registers }
                             if (oper[0]^.typ=top_const) and
                                (oper[1]^.typ=top_reg) and
                                ((oper[0]^.val<low(longint)) or
                                 (oper[0]^.val>high(longint))) then
                               replaceoper:=-1;
{$endif x86_64}
                        end;
                      end;
                    end;
                end;
             end;

            {$ifdef x86_64}
            { 32 bit operations on 32 bit registers on x86_64 can result in
              zeroing the upper 32 bits of the register. This does not happen
              with memory operations, so we have to perform these calculations
              in registers.  }
            if (instr.opsize=S_L) then
              replaceoper:=-1;
            {$endif x86_64}

            { Replace register with spill reference }
            if replaceoper<>-1 then
              begin
                { The operand gets a freshly allocated reference that is
                  filled with a copy of spilltemp. }
                oper[replaceoper]^.typ:=top_ref;
                new(oper[replaceoper]^.ref);
                oper[replaceoper]^.ref^:=spilltemp;
                { memory locations aren't guaranteed to be aligned }
                case opcode of
                  A_MOVAPS:
                    opcode:=A_MOVSS;
                  A_MOVAPD:
                    opcode:=A_MOVSD;
                end;
                result:=true;
              end;
          end;
      end;


{******************************************************************************
                                  Trgx86fpu
******************************************************************************}

    { Starts with an empty used_in_proc set and marks every register in
      usableregsfpu as unused. usableregsfpu itself is not assigned here. }
    constructor Trgx86fpu.create;
      begin
        used_in_proc:=[];
        unusedregsfpu:=usableregsfpu;
      end;


    { Hands out the fpu register; the result is always NR_ST and list is
      not touched. }
    function trgx86fpu.getregisterfpu(list: TAsmList) : tregister;
      begin
        { note: don't return R_ST0, see comments above implementation of }
        { a_loadfpu_* methods in cgcpu (JM)                              }
        result:=NR_ST;
      end;


    { Counterpart of getregisterfpu; intentionally empty. }
    procedure trgx86fpu.ungetregisterfpu(list : TAsmList; r : tregister);
      begin
        { nothing to do, fpu stack management is handled by the load/ }
        { store operations in cgcpu (JM)                              }
      end;


    { Returns a copy of r whose super register has been set to ofs. }
    function trgx86fpu.correct_fpuregister(r : tregister;ofs : byte) : tregister;
      begin
        correct_fpuregister:=r;
        setsupreg(correct_fpuregister,ofs);
      end;


    { Records the registers in s as used by the current procedure. The
      code that would actually store the registers is disabled (see the
      TODO below), so "list" and "saved" are not touched. }
    procedure trgx86fpu.saveusedfpuregisters(list: TAsmList;
                                             var saved : tpushedsavedfpu;
                                             const s: tcpuregisterset);
     { var
         r : tregister;
         hr : treference; }
      begin
        used_in_proc:=used_in_proc+s;

{ TODO: firstsavefpureg}
(*
        { don't try to save the fpu registers if not desired (e.g. for }
        { the 80x86)                                                   }
        if firstsavefpureg <> R_NO then
          for r.enum:=firstsavefpureg to lastsavefpureg do
            begin
              saved[r.enum].ofs:=reg_not_saved;
              { if the register is used by the calling subroutine and if }
              { it's not a regvar (those are handled separately)         }
              if not is_reg_var_other[r.enum] and
                 (r.enum in s) and
                 { and is present in use }
                 not(r.enum in unusedregsfpu) then
                begin
                  { then save it }
                  tg.GetTemp(list,extended_size,tt_persistent,hr);

                  saved[r.enum].ofs:=hr.offset;
                  cg.a_loadfpu_reg_ref(list,OS_FLOAT,OS_FLOAT,r,hr);
                  cg.a_reg_dealloc(list,r);
                  include(unusedregsfpu,r.enum);
                  inc(countunusedregsfpu);
                end;
            end;
*)
      end;


    { Counterpart of saveusedfpuregisters. The whole body is disabled
      (see the TODO below), so calling this procedure has no effect. }
    procedure trgx86fpu.restoreusedfpuregisters(list : TAsmList;
                                                const saved : tpushedsavedfpu);
{
      var
         r,r2 : tregister;
         hr : treference;
}
      begin
{ TODO: firstsavefpureg}
(*
        if firstsavefpureg <> R_NO then
          for r.enum:=lastsavefpureg downto firstsavefpureg do
            begin
              if saved[r.enum].ofs <> reg_not_saved then
                begin
                  r2.enum:=R_INTREGISTER;
                  r2.number:=NR_FRAME_POINTER_REG;
                  reference_reset_base(hr,r2,saved[r.enum].ofs);
                  cg.a_reg_alloc(list,r);
                  cg.a_loadfpu_ref_reg(list,OS_FLOAT,OS_FLOAT,hr,r);
                  if not (r.enum in unusedregsfpu) then
                    { internalerror(10)
                      in n386cal we always save/restore the reg *state*
                      using save/restoreunusedstate -> the current state
                      may not be real (JM) }
                  else
                    begin
                      dec(countunusedregsfpu);
                      exclude(unusedregsfpu,r.enum);
                    end;
                  tg.UnGetTemp(list,hr);
                end;
            end;
*)
      end;

(*
    procedure Trgx86fpu.saveotherregvars(list: TAsmList; const s: totherregisterset);
      var
        r: Tregister;
      begin
        if not(cs_opt_regvar in current_settings.optimizerswitches) then
          exit;
        if firstsavefpureg <> NR_NO then
          for r.enum := firstsavefpureg to lastsavefpureg do
            if is_reg_var_other[r.enum] and
               (r.enum in s) then
              store_regvar(list,r);
      end;
*)

end.
 |