6 anni fa · 078595be4c
--- a/compiler/aarch64/cgcpu.pas
+++ b/compiler/aarch64/cgcpu.pas
@@ -100,6 +100,7 @@ interface
 
															         procedure g_concatcopy_move(list: TAsmList; const source, dest: treference; len: tcgint);
														
 
															         procedure g_concatcopy(list: TAsmList; const source, dest: treference; len: tcgint);override;
														
 
															         procedure g_adjust_self_value(list: TAsmList; procdef: tprocdef; ioffset: tcgint);override;
														
 
															+        procedure g_check_for_fpu_exception(list: TAsmList; force, clear: boolean);override;
														
 
															        private
														
 
															         function save_regs(list: TAsmList; rt: tregistertype; lowsr, highsr: tsuperregister; sub: tsubregister): longint;
														
 
															         procedure load_regs(list: TAsmList; rt: tregistertype; lowsr, highsr: tsuperregister; sub: tsubregister);
														
@@ -1032,6 +1033,7 @@ implementation
 
															             instr:=taicpu.op_reg_reg(A_FCVT,reg2,reg1);
														
 
															           end;
														
 
															         list.Concat(instr);
														
 
															+        maybe_check_for_fpu_exception(list);
														
 
															       end;
														
@@ -2256,6 +2258,40 @@ implementation
 
															       end;
														
 
															+    procedure tcgaarch64.g_check_for_fpu_exception(list: TAsmList;force,clear : boolean);
														
 
															+      var
														
 
															+        r : TRegister;
														
 
															+        ai: taicpu;
														
 
															+        l1,l2: TAsmLabel;
														
 
															+      begin
														
 
															+        { so far, we assume all flavours of AArch64 need explicit floating point exception checking }
														
 
															+        if ((cs_check_fpu_exceptions in current_settings.localswitches) and
														
 
															+            (force or current_procinfo.FPUExceptionCheckNeeded)) then
														
 
															+          begin
														
 
															+            r:=getintregister(list,OS_INT);
														
 
															+            list.concat(taicpu.op_reg_reg(A_MRS,r,NR_FPSR));
														
 
															+            list.concat(taicpu.op_reg_const(A_TST,r,$1f));
														
 
															+            current_asmdata.getjumplabel(l1);
														
 
															+            current_asmdata.getjumplabel(l2);
														
 
															+            ai:=taicpu.op_sym(A_B,l1);
														
 
															+            ai.is_jmp:=true;
														
 
															+            ai.condition:=C_NE;
														
 
															+            list.concat(ai);
														
 
															+            list.concat(taicpu.op_reg_const(A_TST,r,$80));
														
 
															+            ai:=taicpu.op_sym(A_B,l2);
														
 
															+            ai.is_jmp:=true;
														
 
															+            ai.condition:=C_EQ;
														
 
															+            list.concat(ai);
														
 
															+            a_label(list,l1);
														
 
															+            alloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
														
 
															+            cg.a_call_name(list,'FPC_THROWFPUEXCEPTION',false);
														
 
															+            dealloccpuregisters(list,R_INTREGISTER,paramanager.get_volatile_registers_int(pocall_default));
														
 
															+            a_label(list,l2);
														
 
															+            if clear then
														
 
															+              current_procinfo.FPUExceptionCheckNeeded:=false;
														
 
															+          end;
														
 
															+      end;
														
 
															+
														
 
															     procedure create_codegen;
														
 
															       begin
														
--- a/compiler/aarch64/ncpuadd.pas
+++ b/compiler/aarch64/ncpuadd.pas
@@ -218,6 +218,7 @@ interface
 
															         current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(op,
														
 
															            location.register,left.location.register,right.location.register));
														
 
															+        cg.maybe_check_for_fpu_exception(current_asmdata.CurrAsmList);
														
 
															       end;
														
@@ -238,6 +239,7 @@ interface
 
															         { signalling compare so we can get exceptions }
														
 
															         current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_FCMPE,
														
 
															              left.location.register,right.location.register));
														
 
															+        cg.maybe_check_for_fpu_exception(current_asmdata.CurrAsmList);
														
 
															       end;
														
--- a/compiler/aarch64/ncpuinl.pas
+++ b/compiler/aarch64/ncpuinl.pas
@@ -122,6 +122,7 @@ implementation
 
															       begin
														
 
															         load_fpu_location;
														
 
															         current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_FABS,location.register,left.location.register));
														
 
															+        cg.maybe_check_for_fpu_exception(current_asmdata.CurrAsmList);
														
 
															       end;
														
@@ -129,6 +130,7 @@ implementation
 
															       begin
														
 
															         load_fpu_location;
														
 
															         current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(A_FMUL,location.register,left.location.register,left.location.register));
														
 
															+        cg.maybe_check_for_fpu_exception(current_asmdata.CurrAsmList);
														
 
															       end;
														
@@ -136,6 +138,7 @@ implementation
 
															       begin
														
 
															         load_fpu_location;
														
 
															         current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_FSQRT,location.register,left.location.register));
														
 
															+        cg.maybe_check_for_fpu_exception(current_asmdata.CurrAsmList);
														
 
															       end;
														
@@ -168,6 +171,7 @@ implementation
 
															         { convert to signed integer rounding towards zero (there's no "round to
														
 
															           integer using current rounding mode") }
														
 
															         current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_FCVTZS,location.register,hreg));
														
 
															+        cg.maybe_check_for_fpu_exception(current_asmdata.CurrAsmList);
														
 
															       end;
														
--- a/compiler/aarch64/ncpumat.pas
+++ b/compiler/aarch64/ncpumat.pas
@@ -187,6 +187,7 @@ implementation
 
															         location_reset(location,LOC_MMREGISTER,def_cgsize(resultdef));
														
 
															         location.register:=cg.getmmregister(current_asmdata.CurrAsmList,location.size);
														
 
															         current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_FNEG,location.register,left.location.register));
														
 
															+        cg.maybe_check_for_fpu_exception(current_asmdata.CurrAsmList);
														
 
															       end;
														
 
															 begin
														
--- a/rtl/aarch64/aarch64.inc
+++ b/rtl/aarch64/aarch64.inc
@@ -57,14 +57,80 @@ procedure setfpsr(val: dword); nostackframe; assembler;
 
															   end;
														
 
															+const
														
 
															+  FPSR_IOC = 1;
														
 
															+  FPSR_DZC = 1 shl 1;
														
 
															+  FPSR_OFC = 1 shl 2;
														
 
															+  FPSR_UFC = 1 shl 3;
														
 
															+  FPSR_IXC = 1 shl 4;
														
 
															+  FPSR_IDC = 1 shl 7;
														
 
															+  FPSR_EXCEPTIONS = FPSR_IOC or FPSR_DZC or FPSR_OFC or FPSR_UFC or FPSR_IXC or FPSR_IDC;
														
 
															+
														
 
															+
														
 
															+procedure RaisePendingExceptions;
														
 
															+  var
														
 
															+    fpsr : dword;
														
 
															+    f: TFPUException;
														
 
															+  begin
														
 
															+    fpsr:=getfpsr;
														
 
															+    if (fpsr and FPSR_DZC) <> 0 then
														
 
															+      float_raise(exZeroDivide);
														
 
															+    if (fpsr and FPSR_OFC) <> 0 then
														
 
															+      float_raise(exOverflow);
														
 
															+    if (fpsr and FPSR_UFC) <> 0 then
														
 
															+      float_raise(exUnderflow);
														
 
															+    if (fpsr and FPSR_IOC) <> 0 then
														
 
															+      float_raise(exInvalidOp);
														
 
															+    if (fpsr and FPSR_IXC) <> 0 then
														
 
															+      float_raise(exPrecision);
														
 
															+    if (fpsr and FPSR_IDC) <> 0 then
														
 
															+      float_raise(exDenormalized);
														
 
															+    { now the soft float exceptions }
														
 
															+    for f in softfloat_exception_flags do
														
 
															+      float_raise(f);
														
 
															+  end;
														
 
															+
														
 
															+
														
 
															+{ as so far no AArch64 flavour which supports hard floating point exceptions, we use solely
														
 
															+  the softfloat_exception_mask for masking as the masking flags are RAZ and WI if floating point
														
 
															+  exceptions are not supported }
														
 
															+procedure fpc_throwfpuexception;[public,alias:'FPC_THROWFPUEXCEPTION'];
														
 
															+  var
														
 
															+    fpsr : dword;
														
 
															+    f: TFPUException;
														
 
															+  begin
														
 
															+    { at this point, we know already, that an exception will be risen }
														
 
															+    fpsr:=getfpsr;
														
 
															+
														
 
															+    { check, if the exception is masked }
														
 
															+    if ((fpsr and FPSR_DZC) <> 0) and (exZeroDivide in softfloat_exception_mask) then
														
 
															+      fpsr:=fpsr and not(FPSR_DZC);
														
 
															+    if ((fpsr and FPSR_OFC) <> 0) and (exOverflow in softfloat_exception_mask) then
														
 
															+      fpsr:=fpsr and not(FPSR_OFC);
														
 
															+    if ((fpsr and FPSR_UFC) <> 0) and (exUnderflow in softfloat_exception_mask) then
														
 
															+      fpsr:=fpsr and not(FPSR_UFC);
														
 
															+    if ((fpsr and FPSR_IOC) <> 0) and (exInvalidOp in softfloat_exception_mask) then
														
 
															+      fpsr:=fpsr and not(FPSR_IOC);
														
 
															+    if ((fpsr and FPSR_IXC) <> 0) and (exPrecision in softfloat_exception_mask) then
														
 
															+      fpsr:=fpsr and not(FPSR_IXC);
														
 
															+    if ((fpsr and FPSR_IDC) <> 0) and (exDenormalized in softfloat_exception_mask) then
														
 
															+      fpsr:=fpsr and not(FPSR_IDC);
														
 
															+    setfpsr(fpsr);
														
 
															+    if (fpsr and FPSR_EXCEPTIONS)<>0 then
														
 
															+      RaisePendingExceptions;
														
 
															+  end;
														
 
															+
														
 
															+
														
 
															 procedure fpc_enable_fpu_exceptions;
														
 
															   begin
														
 
															     { clear all "exception happened" flags we care about}
														
 
															     setfpsr(getfpsr and not(fpu_exception_mask shr fpu_exception_mask_to_status_mask_shift));
														
 
															     { enable invalid operations and division by zero exceptions. }
														
 
															-    setfpcr(getfpcr or fpu_exception_mask);
														
 
															+    setfpcr((getfpcr and not(fpu_exception_mask)));
														
 
															+    softfloat_exception_mask:=[exPrecision,exUnderflow,exInvalidOp];
														
 
															   end;
														
 
															+
														
 
															 procedure fpc_cpuinit;
														
 
															   begin
														
 
															     { don't let libraries influence the FPU cw set by the host program }
														
--- a/rtl/aarch64/math.inc
+++ b/rtl/aarch64/math.inc
@@ -1,5 +1,5 @@
 
															 {
														
 
															-    Implementation of mathematical routines for x86_64
														
 
															+    Implementation of mathematical routines for AArch64
														
 
															     This file is part of the Free Pascal run time library.
														
 
															     Copyright (c) 1999-2005 by the Free Pascal development team
														
--- a/rtl/aarch64/mathu.inc
+++ b/rtl/aarch64/mathu.inc
@@ -80,9 +80,14 @@ const
 
															 function GetExceptionMask: TFPUExceptionMask;
														
 
															+  {
														
 
															   var
														
 
															     fpcr: dword;
														
 
															+  }
														
 
															   begin
														
 
															+    { as I am not aware of any hardware exception supporting AArch64 implementation,
														
 
															+      and else the trapping enable flags are RAZ, return the softfloat exception mask (FK)
														
 
															+
														
 
															     fpcr:=getfpcr;
														
 
															     result:=[];
														
 
															     if ((fpcr and fpu_ioe)=0) then
														
@@ -97,14 +102,22 @@ function GetExceptionMask: TFPUExceptionMask;
 
															       result := result+[exPrecision];
														
 
															     if ((fpcr and fpu_ide)=0) then
														
 
															       result := result+[exDenormalized];
														
 
															+    }
														
 
															+    result:=softfloat_exception_mask;
														
 
															   end;
														
 
															 function SetExceptionMask(const Mask: TFPUExceptionMask): TFPUExceptionMask;
														
 
															+  {
														
 
															   var
														
 
															     newfpcr: dword;
														
 
															+  }
														
 
															   begin
														
 
															+    { as I am not aware of any hardware exception supporting AArch64 implementation,
														
 
															+      and else the trapping enable flags are RAZ, work solely with softfloat_exception_mask (FK)
														
 
															+    }
														
 
															     softfloat_exception_mask:=mask;
														
 
															+    {
														
 
															     newfpcr:=fpu_exception_mask;
														
 
															     if exInvalidOp in Mask then
														
 
															       newfpcr:=newfpcr and not(fpu_ioe);
														
@@ -118,13 +131,15 @@ function SetExceptionMask(const Mask: TFPUExceptionMask): TFPUExceptionMask;
 
															       newfpcr:=newfpcr and not(fpu_ixe);
														
 
															     if exDenormalized in Mask then
														
 
															       newfpcr:=newfpcr and not(fpu_ide);
														
 
															+    }
														
 
															     { clear "exception happened" flags }
														
 
															     ClearExceptions(false);
														
 
															     { set new exception mask }
														
 
															-    setfpcr((getfpcr and not(fpu_exception_mask)) or newfpcr);
														
 
															+//    setfpcr((getfpcr and not(fpu_exception_mask)) or newfpcr);
														
 
															     { unsupported mask bits will remain 0 -> read exception mask again }
														
 
															-    result:=GetExceptionMask;
														
 
															-    softfloat_exception_mask:=result;
														
 
															+//    result:=GetExceptionMask;
														
 
															+//    softfloat_exception_mask:=result;
														
 
															+    result:=softfloat_exception_mask;
														
 
															   end;