{
    Copyright (c) 2014 Jonas Maebe

    Code generation for add nodes on AArch64

    This program is free software; you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation; either version 2 of the License, or
    (at your option) any later version.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with this program; if not, write to the Free Software
    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.

****************************************************************************}
unit ncpuadd;

{$i fpcdefs.inc}

interface

    uses
       node,ncgadd,cpubase;

    type
       { Add node for AArch64: overrides the code generation hooks of
         tcgaddnode for float, boolean, small set, ordinal and 64 bit
         operands. }
       taarch64addnode = class(tcgaddnode)
       private
          function  GetResFlags(unsigned:Boolean):TResFlags;
          function  GetFPUResFlags:TResFlags;
       protected
          function use_fma : boolean;override;
          procedure second_addfloat;override;
          procedure second_cmpfloat;override;
          procedure second_cmpboolean;override;
          procedure second_cmpsmallset;override;
          procedure second_cmpordinal;override;
          procedure second_addordinal;override;
          procedure second_add64bit; override;
          procedure second_cmp64bit; override;
       public
          function use_generic_mul32to64: boolean; override;
       end;

  implementation

    uses
      systems,
      cutils,verbose,
      paramgr,procinfo,
      aasmtai,aasmdata,aasmcpu,defutil,
      cgbase,cgcpu,cgutils,
      cpupara,
      ncon,nset,nadd,
      hlcgobj, ncgutil,cgobj;

{*****************************************************************************
                               taarch64addnode
*****************************************************************************}

    { Unconditionally reports true. }
    function taarch64addnode.use_fma : boolean;
      begin
        use_fma:=true;
      end;


    { Translates the comparison node type into the condition flag that has to
      be tested after an integer compare.

      unsigned: selects the HI/HS/LO/LS conditions instead of GT/GE/LT/LE.

      When nf_swapped is set in the node flags, the mirrored condition is
      returned (e.g. ltn yields the "greater" flag). equaln/unequaln map to
      F_EQ/F_NE regardless of both settings. Any other node type ends in an
      internalerror. }
    function taarch64addnode.GetResFlags(unsigned:Boolean):TResFlags;
      var
        swapped : boolean;
      begin
        case nodetype of
          equaln:
            result:=F_EQ;
          unequaln:
            result:=F_NE;
          else
            begin
              swapped:=nf_swapped in flags;
              if unsigned then
                begin
                  if swapped then
                    case nodetype of
                      ltn:
                        result:=F_HI;
                      lten:
                        result:=F_HS;
                      gtn:
                        result:=F_LO;
                      gten:
                        result:=F_LS;
                      else
                        internalerror(2014082012);
                    end
                  else
                    case nodetype of
                      ltn:
                        result:=F_LO;
                      lten:
                        result:=F_LS;
                      gtn:
                        result:=F_HI;
                      gten:
                        result:=F_HS;
                      else
                        internalerror(2014082013);
                    end;
                end
              else
                begin
                  if swapped then
                    case nodetype of
                      ltn:
                        result:=F_GT;
                      lten:
                        result:=F_GE;
                      gtn:
                        result:=F_LT;
                      gten:
                        result:=F_LE;
                      else
                        internalerror(2014082010);
                    end
                  else
                    case nodetype of
                      ltn:
                        result:=F_LT;
                      lten:
                        result:=F_LE;
                      gtn:
                        result:=F_GT;
                      gten:
                        result:=F_GE;
                      else
                        internalerror(2014082011);
                    end;
                end;
            end;
        end;
      end;


    { Translates the comparison node type into the condition flag that has to
      be tested after a floating point compare.

      "Less" relations are expressed with F_LO/F_LS and "greater" relations
      with F_GT/F_GE; with nf_swapped set the two groups trade places.
      NOTE(review): presumably this particular mix is chosen so that an
      unordered compare result never satisfies the condition -- confirm
      against the NZCV encoding of FCMP/FCMPE.

      Node types other than the six comparison types end in an
      internalerror. }
    function taarch64addnode.GetFPUResFlags:TResFlags;
      var
        swapped : boolean;
      begin
        case nodetype of
          equaln:
            GetFPUResFlags:=F_EQ;
          unequaln:
            GetFPUResFlags:=F_NE;
          else
            begin
              swapped:=nf_swapped in flags;
              if not swapped then
                case nodetype of
                  ltn:
                    GetFPUResFlags:=F_LO;
                  lten:
                    GetFPUResFlags:=F_LS;
                  gtn:
                    GetFPUResFlags:=F_GT;
                  gten:
                    GetFPUResFlags:=F_GE;
                  else
                    internalerror(2014082015);
                end
              else
                case nodetype of
                  ltn:
                    GetFPUResFlags:=F_GT;
                  lten:
                    GetFPUResFlags:=F_GE;
                  gtn:
                    GetFPUResFlags:=F_LO;
                  gten:
                    GetFPUResFlags:=F_LS;
                  else
                    internalerror(2014082014);
                end;
            end;
        end;
      end;


    { Generates a scalar floating point add/sub/mul/div (FADD, FSUB, FMUL,
      FDIV) of left and right into a freshly allocated mm register, followed
      by the optional fpu exception check. Other node types end in an
      internalerror. }
    procedure taarch64addnode.second_addfloat;
      var
        fpuop : TAsmOp;
      begin
        pass_left_right;
        { undo an earlier operand swap so that left/right are in source order }
        if nf_swapped in flags then
          swapleftright;

        { both operands have to live in an mm register; the order in which
          they are loaded is irrelevant }
        hlcg.location_force_mmregscalar(current_asmdata.CurrAsmList,left.location,left.resultdef,true);
        hlcg.location_force_mmregscalar(current_asmdata.CurrAsmList,right.location,right.resultdef,true);

        location_reset(location,LOC_MMREGISTER,def_cgsize(resultdef));
        location.register:=cg.getmmregister(current_asmdata.CurrAsmList,location.size);

        case nodetype of
          addn :
            fpuop:=A_FADD;
          subn :
            fpuop:=A_FSUB;
          muln :
            fpuop:=A_FMUL;
          slashn :
            fpuop:=A_FDIV;
          else
            internalerror(200306014);
        end;

        { result := left <fpuop> right }
        current_asmdata.CurrAsmList.concat(
          taicpu.op_reg_reg_reg(fpuop,location.register,left.location.register,right.location.register));
        cg.maybe_check_for_fpu_exception(current_asmdata.CurrAsmList);
      end;


    { Generates a floating point compare of left and right; the result is
      left in the flags, with the condition chosen by GetFPUResFlags. }
    procedure taarch64addnode.second_cmpfloat;
      begin
        pass_left_right;
        if nf_swapped in flags then
          swapleftright;

        { both operands have to live in an mm register; the order in which
          they are loaded is irrelevant }
        hlcg.location_force_mmregscalar(current_asmdata.CurrAsmList,left.location,left.resultdef,true);
        hlcg.location_force_mmregscalar(current_asmdata.CurrAsmList,right.location,right.resultdef,true);

        location_reset(location,LOC_FLAGS,OS_NO);
        location.resflags:=getfpuresflags;

        { FCMPE is the signalling variant, so exceptions can be raised }
        current_asmdata.CurrAsmList.concat(
          taicpu.op_reg_reg(A_FCMPE,left.location.register,right.location.register));
        cg.maybe_check_for_fpu_exception(current_asmdata.CurrAsmList);
      end;


    { Generates a compare of two booleans; the result is left in the flags
      using the unsigned conditions of GetResFlags. }
    procedure taarch64addnode.second_cmpboolean;
      begin
        pass_left_right;
        force_reg_left_right(true,true);

        if right.location.loc<>LOC_CONSTANT then
          { register against register }
          current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_CMP,left.location.register,right.location.register))
        else if right.location.value<0 then
          { negative constant: CMN with the negated value; range/overflow
            checking is disabled to avoid overflow if value=low(int64) }
{$push}{$r-}{$q-}
          Tcgaarch64(cg).handle_reg_imm12_reg(current_asmdata.CurrAsmList,A_CMN,left.location.size,left.location.register,-right.location.value,NR_XZR,NR_NO,false,false)
{$pop}
        else
          { non-negative constant: plain CMP }
          Tcgaarch64(cg).handle_reg_imm12_reg(current_asmdata.CurrAsmList,A_CMP,left.location.size,left.location.register,right.location.value,NR_XZR,NR_NO,false,false);

        location_reset(location,LOC_FLAGS,OS_NO);
        location.resflags:=getresflags(true);
      end;


    { Generates a compare of two small sets; the result is left in the flags.

      equaln/unequaln compare the operands directly. lten/gten emit
      "(left and right) compared with right" (after a possible operand swap)
      and test F_EQ. Other node types end in an internalerror. }
    procedure taarch64addnode.second_cmpsmallset;
      var
        andreg : tregister;
        cmpinstr : tasmop;
      begin
        pass_left_right;
        location_reset(location,LOC_FLAGS,OS_NO);
        force_reg_left_right(true,true);

        { for DFA }
        cmpinstr:=A_NONE;
        if right.location.loc=LOC_CONSTANT then
          begin
            { when doing a cmp/cmn on 32 bit, we care whether the *lower 32 bit*
              is a positive/negative value -> sign extend }
            if not(right.location.size in [OS_64,OS_S64]) then
              right.location.value:=longint(right.location.value);
            { the immediate is passed as abs(value) below, so a negative
              constant needs CMN rather than CMP }
            if right.location.value<0 then
              cmpinstr:=A_CMN
            else
              cmpinstr:=A_CMP;
          end;

        case nodetype of
          equaln,
          unequaln:
            begin
              if right.location.loc<>LOC_CONSTANT then
                current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_CMP,left.location.register,right.location.register))
              else
                tcgaarch64(cg).handle_reg_imm12_reg(current_asmdata.CurrAsmList,cmpinstr,def_cgsize(resultdef),left.location.register,abs(right.location.value),NR_XZR,NR_NO,false,false);
              location.resflags:=getresflags(true);
            end;
          lten,
          gten:
            begin
              { swap for an unswapped lten or an already swapped gten }
              if ((nodetype=lten) and
                  not(nf_swapped in flags)) or
                 ((nodetype=gten) and
                  (nf_swapped in flags)) then
                swapleftright;
              { we can't handle left as a constant yet }
              if left.location.loc=LOC_CONSTANT then
                hlcg.location_force_reg(current_asmdata.CurrAsmList,left.location,left.resultdef,left.resultdef,true);
              andreg:=cg.getintregister(current_asmdata.CurrAsmList,left.location.size);
              if right.location.loc<>LOC_CONSTANT then
                begin
                  { andreg := left and right; compare andreg with right }
                  current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(A_AND,andreg,left.location.register,right.location.register));
                  current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_CMP,andreg,right.location.register));
                end
              else
                begin
                  { same as above, with right as an immediate }
                  hlcg.a_op_const_reg_reg(current_asmdata.CurrAsmList,OP_AND,resultdef,right.location.value,left.location.register,andreg);
                  tcgaarch64(cg).handle_reg_imm12_reg(current_asmdata.CurrAsmList,cmpinstr,def_cgsize(resultdef),andreg,abs(right.location.value),NR_XZR,NR_NO,false,false)
                end;
              location.resflags:=F_EQ;
            end;
          else
            internalerror(2012042701);
        end;
      end;


    { Generates a compare of two ordinals; the result is left in the flags.
      The unsigned conditions are used as soon as one of the two operand
      types is not signed. }
    procedure taarch64addnode.second_cmpordinal;
      var
        unsignedcmp : boolean;
      begin
        pass_left_right;
        force_reg_left_right(true,true);

        unsignedcmp:=not(is_signed(left.resultdef)) or
                     not(is_signed(right.resultdef));

        if right.location.loc<>LOC_CONSTANT then
          { register against register }
          current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_CMP,left.location.register,right.location.register))
        else if right.location.value<0 then
          { negative constant: CMN with the negated value, evaluated with
            range/overflow checking disabled }
{$push}{$r-}{$q-}
          Tcgaarch64(cg).handle_reg_imm12_reg(current_asmdata.CurrAsmList,A_CMN,left.location.size,left.location.register,-right.location.value,NR_XZR,NR_NO,false,false)
{$pop}
        else
          { non-negative constant: plain CMP }
          Tcgaarch64(cg).handle_reg_imm12_reg(current_asmdata.CurrAsmList,A_CMP,left.location.size,left.location.register,right.location.value,NR_XZR,NR_NO,false,false);

        location_reset(location,LOC_FLAGS,OS_NO);
        location.resflags:=getresflags(unsignedcmp);
      end;


    { Handles the 32x32->64 bit multiplication with a single SMULL/UMULL;
      every other ordinal operation is delegated to the inherited
      implementation. }
    procedure taarch64addnode.second_addordinal;
      const
        { indexed by "is the multiplication unsigned" }
        widemulops: array[boolean] of TAsmOp = (A_SMULL,A_UMULL);
      var
        unsignedmul: boolean;
      begin
        { anything but a 32x32->64 multiplication goes to the generic code }
        if not((nodetype=muln) and
               is_32bit(left.resultdef) and
               is_32bit(right.resultdef) and
               is_64bit(resultdef)) then
          begin
            inherited second_addordinal;
            exit;
          end;

        { UMULL as soon as one of the two operand types is not signed }
        unsignedmul:=not(is_signed(left.resultdef)) or
                     not(is_signed(right.resultdef));
        pass_left_right;
        force_reg_left_right(true,true);
        { force_reg_left_right can leave right as a LOC_CONSTANT (there is no
          way to say "a constant register is okay, but an ordinal constant
          isn't") }
        if right.location.loc=LOC_CONSTANT then
          hlcg.location_force_reg(current_asmdata.CurrAsmList,right.location,right.resultdef,right.resultdef,true);
        location_reset(location,LOC_REGISTER,def_cgsize(resultdef));
        location.register:=cg.getintregister(current_asmdata.CurrAsmList,def_cgsize(resultdef));
        current_asmdata.CurrAsmList.Concat(
          taicpu.op_reg_reg_reg(widemulops[unsignedmul],location.register,left.location.register,right.location.register));
      end;


    { 64 bit additions are handled by the ordinal code path. }
    procedure taarch64addnode.second_add64bit;
      begin
        second_addordinal;
      end;


    { 64 bit compares are handled by the ordinal code path. }
    procedure taarch64addnode.second_cmp64bit;
      begin
        second_cmpordinal;
      end;


    { Unconditionally reports false. }
    function taarch64addnode.use_generic_mul32to64: boolean;
      begin
        use_generic_mul32to64:=false;
      end;


begin
  { register this class as the add node class to instantiate }
  caddnode:=taarch64addnode;
end.
 |