10 年之前 · 0af4f3e3fb
--- a/.gitattributes
+++ b/.gitattributes
@@ -25,6 +25,7 @@ compiler/aarch64/itcpugas.pas svneol=native#text/plain
 
				 compiler/aarch64/ncpuadd.pas svneol=native#text/plain
			
 
				 compiler/aarch64/ncpucnv.pas svneol=native#text/plain
			
 
				 compiler/aarch64/ncpuinl.pas svneol=native#text/plain
			
 
				+compiler/aarch64/ncpumat.pas svneol=native#text/plain
			
 
				 compiler/aarch64/ra64con.inc svneol=native#text/plain
			
 
				 compiler/aarch64/ra64dwa.inc svneol=native#text/plain
			
 
				 compiler/aarch64/ra64nor.inc svneol=native#text/plain
			
--- a/compiler/aarch64/ncpumat.pas
+++ b/compiler/aarch64/ncpumat.pas
@@ -0,0 +1,187 @@
 
				+{
			
 
				+    Copyright (c) 1998-2002, 2014 by Florian Klaempfl and Jonas Maebe
			
 
				+
			
 
				+    Generate AArch64 assembler for math nodes
			
 
				+
			
 
				+    This program is free software; you can redistribute it and/or modify
			
 
				+    it under the terms of the GNU General Public License as published by
			
 
				+    the Free Software Foundation; either version 2 of the License, or
			
 
				+    (at your option) any later version.
			
 
				+
			
 
				+    This program is distributed in the hope that it will be useful,
			
 
				+    but WITHOUT ANY WARRANTY; without even the implied warranty of
			
 
				+    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
			
 
				+    GNU General Public License for more details.
			
 
				+
			
 
				+    You should have received a copy of the GNU General Public License
			
 
				+    along with this program; if not, write to the Free Software
			
 
				+    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
			
 
				+
			
 
				+ ****************************************************************************
			
 
				+}
			
 
				+unit ncpumat;
			
 
				+
			
 
				+{$i fpcdefs.inc}
			
 
				+
			
 
				+interface
			
 
				+
			
 
				+    uses
			
 
				+      node,nmat,ncgmat;
			
 
				+
			
 
				+    type
			
 
				+      taarch64moddivnode = class(tmoddivnode)
			
 
				+         procedure pass_generate_code;override;
			
 
				+      end;
			
 
				+
			
 
				+      taarch64notnode = class(tcgnotnode)
			
 
				+         procedure second_boolean;override;
			
 
				+      end;
			
 
				+
			
 
				+      taarch64unaryminusnode = class(tcgunaryminusnode)
			
 
				+         procedure second_float; override;
			
 
				+      end;
			
 
				+
			
 
				+implementation
			
 
				+
			
 
				+    uses
			
 
				+      globtype,systems,constexp,
			
 
				+      cutils,verbose,globals,
			
 
				+      symconst,symdef,
			
 
				+      aasmbase,aasmcpu,aasmtai,aasmdata,
			
 
				+      defutil,
			
 
				+      cgbase,cgobj,hlcgobj,pass_2,procinfo,
			
 
				+      ncon,
			
 
				+      cpubase,
			
 
				+      ncgutil,cgcpu,cgutils;
			
 
				+
			
 
				+{*****************************************************************************
			
 
				+                             taarch64moddivnode
			
 
				+*****************************************************************************}
			
 
				+
			
 
				+    procedure taarch64moddivnode.pass_generate_code;
			
 
				+      var
			
 
				+         op         : tasmop;
			
 
				+         tmpreg,
			
 
				+         numerator,
			
 
				+         divider,
			
 
				+         resultreg  : tregister;
			
 
				+         hl : tasmlabel;
			
 
				+         overflowloc: tlocation;
			
 
				+      begin
			
 
				+       secondpass(left);
			
 
				+       secondpass(right);
			
 
				+
			
 
				+       { set result location }
			
 
				+       location_reset(location,LOC_REGISTER,def_cgsize(resultdef));
			
 
				+       location.register:=cg.getintregister(current_asmdata.CurrAsmList,def_cgsize(resultdef));
			
 
				+       resultreg:=location.register;
			
 
				+
			
 
				+       { put numerator in register }
			
 
				+       hlcg.location_force_reg(current_asmdata.CurrAsmList,left.location,left.resultdef,left.resultdef,true);
			
 
				+       numerator:=left.location.register;
			
 
				+
			
 
				+       { load divider in a register }
			
 
				+       hlcg.location_force_reg(current_asmdata.CurrAsmList,right.location,right.resultdef,right.resultdef,true);
			
 
				+       divider:=right.location.register;
			
 
				+
			
 
				+       { start division }
			
 
				+       if is_signed(left.resultdef) then
			
 
				+         op:=A_SDIV
			
 
				+       else
			
 
				+         op:=A_UDIV;
			
 
				+       current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(op,location.register,numerator,divider));
			
 
				+
			
 
				+       { no divide-by-zero detection available in hardware, emulate (if it's a
			
 
				+         constant, this will have been detected earlier already) }
			
 
				+       if (right.nodetype<>ordconstn) then
			
 
				+         begin
			
 
				+           current_asmdata.CurrAsmList.concat(taicpu.op_reg_const(A_CMP,
			
 
				+             right.location.register,0));
			
 
				+
			
 
				+           current_asmdata.getjumplabel(hl);
			
 
				+           current_asmdata.CurrAsmList.concat(taicpu.op_cond_sym(A_B,C_NE,hl));
			
 
				+           cg.a_call_name(current_asmdata.CurrAsmList,'FPC_DIVBYZERO',false);
			
 
				+           cg.a_label(current_asmdata.CurrAsmList,hl);
			
 
				+         end;
			
 
				+
			
 
				+       { in case of overflow checking, also check for low(int64) div (-1)
			
 
				+         (no hardware support for this either) }
			
 
				+       if (cs_check_overflow in current_settings.localswitches) and
			
 
				+          is_signed(left.resultdef) and
			
 
				+          ((right.nodetype<>ordconstn) or
			
 
				+           (tordconstnode(right).value=-1)) then
			
 
				+         begin
			
 
				+           { num=ffff... and div=8000... <=>
			
 
				+             num xor not(div xor 8000...) = 0
			
 
				+             (and we have the "eon" operation, which performs "xor not(...)" }
			
 
				+           tmpreg:=hlcg.getintregister(current_asmdata.CurrAsmList,left.resultdef);
			
 
				+           hlcg.a_op_const_reg_reg(current_asmdata.CurrAsmList,OP_XOR,left.resultdef,low(int64),left.location.register,tmpreg);
			
 
				+           current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(A_EON,
			
 
				+             tmpreg,left.location.register,tmpreg));
			
 
				+           current_asmdata.CurrAsmList.concat(taicpu.op_reg_const(A_CMP,tmpreg,0));
			
 
				+           { now the zero/equal flag is set in case we divided low(int64) by
			
 
				+             (-1) }
			
 
				+           location_reset(overflowloc,LOC_FLAGS,OS_NO);
			
 
				+           overflowloc.resflags:=F_EQ;
			
 
				+           cg.g_overflowcheck_loc(current_asmdata.CurrAsmList,location,resultdef,overflowloc);
			
 
				+         end;
			
 
				+
			
 
				+       { in case of modulo, multiply result again by the divider and subtract
			
 
				+         from the numerator }
			
 
				+       if nodetype=modn then
			
 
				+         current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg_reg(A_MSUB,resultreg,
			
 
				+           resultreg,divider,numerator));
			
 
				+    end;
			
 
				+
			
 
				+
			
 
				+{*****************************************************************************
			
 
				+                               taarch64notnode
			
 
				+*****************************************************************************}
			
 
				+
			
 
				+    procedure taarch64notnode.second_boolean;
			
 
				+      begin
			
 
				+        if not handle_locjump then
			
 
				+          begin
			
 
				+            secondpass(left);
			
 
				+            case left.location.loc of
			
 
				+              LOC_FLAGS :
			
 
				+                begin
			
 
				+                  location_copy(location,left.location);
			
 
				+                  inverse_flags(location.resflags);
			
 
				+                end;
			
 
				+              LOC_REGISTER, LOC_CREGISTER,
			
 
				+              LOC_REFERENCE, LOC_CREFERENCE,
			
 
				+              LOC_SUBSETREG, LOC_CSUBSETREG,
			
 
				+              LOC_SUBSETREF, LOC_CSUBSETREF:
			
 
				+                begin
			
 
				+                  hlcg.location_force_reg(current_asmdata.CurrAsmList,left.location,left.resultdef,left.resultdef,true);
			
 
				+                  current_asmdata.CurrAsmList.concat(taicpu.op_reg_const(A_CMP,
			
 
				+                    left.location.register,0));
			
 
				+                  location_reset(location,LOC_FLAGS,OS_NO);
			
 
				+                  location.resflags:=F_EQ;
			
 
				+               end;
			
 
				+              else
			
 
				+                internalerror(2003042401);
			
 
				+            end;
			
 
				+          end;
			
 
				+      end;
			
 
				+
			
 
				+
			
 
				+{*****************************************************************************
			
 
				+                                   taarch64unaryminusnode
			
 
				+*****************************************************************************}
			
 
				+
			
 
				+    procedure taarch64unaryminusnode.second_float;
			
 
				+      begin
			
 
				+        secondpass(left);
			
 
				+        hlcg.location_force_mmregscalar(current_asmdata.CurrAsmList,left.location,left.resultdef,true);
			
 
				+        location_reset(location,LOC_MMREGISTER,def_cgsize(resultdef));
			
 
				+        location.register:=cg.getmmregister(current_asmdata.CurrAsmList,location.size);
			
 
				+        current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_FNEG,location.register,left.location.register));
			
 
				+      end;
			
 
				+
			
 
				+begin
			
 
				+   cmoddivnode:=taarch64moddivnode;
			
 
				+   cnotnode:=taarch64notnode;
			
 
				+   cunaryminusnode:=taarch64unaryminusnode;
			
 
				+end.