19 ani în urmă · 454120a504
--- a/rtl/inc/softfpu.pp
+++ b/rtl/inc/softfpu.pp
@@ -28,6 +28,39 @@ Derivative works are acceptable, even for commercial purposes, so long as
 
				 include prominent notice akin to these four paragraphs for those parts of
			
 
				 this code that are retained.
			
 
				 
			
 
				+===============================================================================
			
 
				+The float80 and float128 part is translated from the softfloat package
			
 
				+by Florian Klaempfl and contained the following copyright notice
			
 
				+===============================================================================
			
 
				+
			
 
				+This C source file is part of the SoftFloat IEC/IEEE Floating-point Arithmetic
			
 
				+Package, Release 2b.
			
 
				+
			
 
				+Written by John R. Hauser.  This work was made possible in part by the
			
 
				+International Computer Science Institute, located at Suite 600, 1947 Center
			
 
				+Street, Berkeley, California 94704.  Funding was partially provided by the
			
 
				+National Science Foundation under grant MIP-9311980.  The original version
			
 
				+of this code was written as part of a project to build a fixed-point vector
			
 
				+processor in collaboration with the University of California at Berkeley,
			
 
				+overseen by Profs. Nelson Morgan and John Wawrzynek.  More information
			
 
				+is available through the Web page `http://www.cs.berkeley.edu/~jhauser/
			
 
				+arithmetic/SoftFloat.html'.
			
 
				+
			
 
				+THIS SOFTWARE IS DISTRIBUTED AS IS, FOR FREE.  Although reasonable effort has
			
 
				+been made to avoid it, THIS SOFTWARE MAY CONTAIN FAULTS THAT WILL AT TIMES
			
 
				+RESULT IN INCORRECT BEHAVIOR.  USE OF THIS SOFTWARE IS RESTRICTED TO PERSONS
			
 
				+AND ORGANIZATIONS WHO CAN AND WILL TAKE FULL RESPONSIBILITY FOR ALL LOSSES,
			
 
				+COSTS, OR OTHER PROBLEMS THEY INCUR DUE TO THE SOFTWARE, AND WHO FURTHERMORE
			
 
				+EFFECTIVELY INDEMNIFY JOHN HAUSER AND THE INTERNATIONAL COMPUTER SCIENCE
			
 
				+INSTITUTE (possibly via similar legal warning) AGAINST ALL LOSSES, COSTS, OR
			
 
				+OTHER PROBLEMS INCURRED BY THEIR CUSTOMERS AND CLIENTS DUE TO THE SOFTWARE.
			
 
				+
			
 
				+Derivative works are acceptable, even for commercial purposes, so long as
			
 
				+(1) the source code for the derivative work includes prominent notice that
			
 
				+the work is derivative, and (2) the source code includes prominent notice with
			
 
				+these four paragraphs for those parts of this code that are retained.
			
 
				+
			
 
				+
			
 
				 ===============================================================================
			
 
				 *}
			
 
				 
			
@@ -4658,6 +4691,2121 @@ Begin
 
				     int64_to_float64:= float_result;
			
 
				 End;
			
 
				 
			
 
				+
			
 
				+{$ifdef FPC_SOFTFLOAT_FLOATX80}
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the extended double-precision floating-
			
 
				+| point value `a' to the 32-bit two's complement integer format.  The
			
 
				+| conversion is performed according to the IEC/IEEE Standard for Binary
			
 
				+| Floating-Point Arithmetic---which means in particular that the conversion
			
 
				+| is rounded according to the current rounding mode.  If `a' is a NaN, the
			
 
				+| largest positive integer is returned.  Otherwise, if the conversion
			
 
				+| overflows, the largest integer with the same sign as `a' is returned.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_to_int32(a: floatx80): int32;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp, shiftCount;
			
 
				+    bits64 aSig;
			
 
				+
			
 
				+    aSig := extractFloatx80Frac( a );
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    if ( ( aExp = $7FFF ) and (bits64) ( aSig shl 1 ) ) aSign := 0;
			
 
				+    shiftCount := $4037 - aExp;
			
 
				+    if ( shiftCount <= 0 ) shiftCount := 1;
			
 
				+    shift64RightJamming( aSig, shiftCount, &aSig );
			
 
				+    result := roundAndPackInt32( aSign, aSig );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the extended double-precision floating-
			
 
				+| point value `a' to the 32-bit two's complement integer format.  The
			
 
				+| conversion is performed according to the IEC/IEEE Standard for Binary
			
 
				+| Floating-Point Arithmetic, except that the conversion is always rounded
			
 
				+| toward zero.  If `a' is a NaN, the largest positive integer is returned.
			
 
				+| Otherwise, if the conversion overflows, the largest integer with the same
			
 
				+| sign as `a' is returned.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_to_int32_round_to_zero(a: floatx80): int32;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp, shiftCount;
			
 
				+    bits64 aSig, savedASig;
			
 
				+    int32 z;
			
 
				+
			
 
				+    aSig := extractFloatx80Frac( a );
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    if ( $401E < aExp ) begin
			
 
				+        if ( ( aExp = $7FFF ) and (bits64) ( aSig shl 1 ) ) aSign := 0;
			
 
				+        goto invalid;
			
 
				+    end;
			
 
				+    else if ( aExp < $3FFF ) begin
			
 
				+        if ( aExp or aSig ) float_exception_flags or= float_flag_inexact;
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    shiftCount := $403E - aExp;
			
 
				+    savedASig := aSig;
			
 
				+    aSig >>= shiftCount;
			
 
				+    z := aSig;
			
 
				+    if ( aSign ) z := - z;
			
 
				+    if ( ( z < 0 ) xor aSign ) begin
			
 
				+ invalid:
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        result := aSign ? (sbits32) $80000000 : $7FFFFFFF;
			
 
				+    end;
			
 
				+    if ( ( aSig shl shiftCount ) <> savedASig ) begin
			
 
				+        float_exception_flags or= float_flag_inexact;
			
 
				+    end;
			
 
				+    result := z;
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the extended double-precision floating-
			
 
				+| point value `a' to the 64-bit two's complement integer format.  The
			
 
				+| conversion is performed according to the IEC/IEEE Standard for Binary
			
 
				+| Floating-Point Arithmetic---which means in particular that the conversion
			
 
				+| is rounded according to the current rounding mode.  If `a' is a NaN,
			
 
				+| the largest positive integer is returned.  Otherwise, if the conversion
			
 
				+| overflows, the largest integer with the same sign as `a' is returned.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_to_int64(a: floatx80): int64;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp, shiftCount;
			
 
				+    bits64 aSig, aSigExtra;
			
 
				+
			
 
				+    aSig := extractFloatx80Frac( a );
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    shiftCount := $403E - aExp;
			
 
				+    if ( shiftCount <= 0 ) begin
			
 
				+        if ( shiftCount ) begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            if (    ! aSign
			
 
				+                 or (    ( aExp = $7FFF )
			
 
				+                      and ( aSig <> LIT64( $8000000000000000 ) ) )
			
 
				+               ) begin
			
 
				+                result := LIT64( $7FFFFFFFFFFFFFFF );
			
 
				+            end;
			
 
				+            result := (sbits64) LIT64( $8000000000000000 );
			
 
				+        end;
			
 
				+        aSigExtra := 0;
			
 
				+    end;
			
 
				+    else begin
			
 
				+        shift64ExtraRightJamming( aSig, 0, shiftCount, &aSig, &aSigExtra );
			
 
				+    end;
			
 
				+    result := roundAndPackInt64( aSign, aSig, aSigExtra );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the extended double-precision floating-
			
 
				+| point value `a' to the 64-bit two's complement integer format.  The
			
 
				+| conversion is performed according to the IEC/IEEE Standard for Binary
			
 
				+| Floating-Point Arithmetic, except that the conversion is always rounded
			
 
				+| toward zero.  If `a' is a NaN, the largest positive integer is returned.
			
 
				+| Otherwise, if the conversion overflows, the largest integer with the same
			
 
				+| sign as `a' is returned.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_to_int64_round_to_zero(a: floatx80): int64;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp, shiftCount;
			
 
				+    bits64 aSig;
			
 
				+    int64 z;
			
 
				+
			
 
				+    aSig := extractFloatx80Frac( a );
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    shiftCount := aExp - $403E;
			
 
				+    if ( 0 <= shiftCount ) begin
			
 
				+        aSig &= LIT64( $7FFFFFFFFFFFFFFF );
			
 
				+        if ( ( a.high <> $C03E ) or aSig ) begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            if ( ! aSign or ( ( aExp = $7FFF ) and aSig ) ) begin
			
 
				+                result := LIT64( $7FFFFFFFFFFFFFFF );
			
 
				+            end;
			
 
				+        end;
			
 
				+        result := (sbits64) LIT64( $8000000000000000 );
			
 
				+    end;
			
 
				+    else if ( aExp < $3FFF ) begin
			
 
				+        if ( aExp or aSig ) float_exception_flags or= float_flag_inexact;
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    z := aSig>>( - shiftCount );
			
 
				+    if ( (bits64) ( aSig shl ( shiftCount and 63 ) ) ) begin
			
 
				+        float_exception_flags or= float_flag_inexact;
			
 
				+    end;
			
 
				+    if ( aSign ) z := - z;
			
 
				+    result := z;
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the extended double-precision floating-
			
 
				+| point value `a' to the single-precision floating-point format.  The
			
 
				+| conversion is performed according to the IEC/IEEE Standard for Binary
			
 
				+| Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_to_float32(a: floatx80): float32;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp;
			
 
				+    bits64 aSig;
			
 
				+
			
 
				+    aSig := extractFloatx80Frac( a );
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if ( (bits64) ( aSig shl 1 ) ) begin
			
 
				+            result := commonNaNToFloat32( floatx80ToCommonNaN( a ) );
			
 
				+        end;
			
 
				+        result := packFloat32( aSign, $FF, 0 );
			
 
				+    end;
			
 
				+    shift64RightJamming( aSig, 33, &aSig );
			
 
				+    if ( aExp or aSig ) aExp -= $3F81;
			
 
				+    result := roundAndPackFloat32( aSign, aExp, aSig );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the extended double-precision floating-
			
 
				+| point value `a' to the double-precision floating-point format.  The
			
 
				+| conversion is performed according to the IEC/IEEE Standard for Binary
			
 
				+| Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_to_float64(a: floatx80): float64;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp;
			
 
				+    bits64 aSig, zSig;
			
 
				+
			
 
				+    aSig := extractFloatx80Frac( a );
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if ( (bits64) ( aSig shl 1 ) ) begin
			
 
				+            result := commonNaNToFloat64( floatx80ToCommonNaN( a ) );
			
 
				+        end;
			
 
				+        result := packFloat64( aSign, $7FF, 0 );
			
 
				+    end;
			
 
				+    shift64RightJamming( aSig, 1, &zSig );
			
 
				+    if ( aExp or aSig ) aExp -= $3C01;
			
 
				+    result := roundAndPackFloat64( aSign, aExp, zSig );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{$ifdef FPC_SOFTFLOAT_FLOAT128}
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the extended double-precision floating-
			
 
				+| point value `a' to the quadruple-precision floating-point format.  The
			
 
				+| conversion is performed according to the IEC/IEEE Standard for Binary
			
 
				+| Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_to_float128(a: floatx80): float128;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int16 aExp;
			
 
				+    bits64 aSig, zSig0, zSig1;
			
 
				+
			
 
				+    aSig := extractFloatx80Frac( a );
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    if ( ( aExp = $7FFF ) and (bits64) ( aSig shl 1 ) ) begin
			
 
				+        result := commonNaNToFloat128( floatx80ToCommonNaN( a ) );
			
 
				+    end;
			
 
				+    shift128Right( aSig shl 1, 0, 16, &zSig0, &zSig1 );
			
 
				+    result := packFloat128( aSign, aExp, zSig0, zSig1 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{$endif FPC_SOFTFLOAT_FLOAT128}
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Rounds the extended double-precision floating-point value `a' to an integer,
			
 
				+| and Returns the result as an extended quadruple-precision floating-point
			
 
				+| value.  The operation is performed according to the IEC/IEEE Standard for
			
 
				+| Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_round_to_int(a: floatx80): floatx80;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp;
			
 
				+    bits64 lastBitMask, roundBitsMask;
			
 
				+    int8 roundingMode;
			
 
				+    floatx80 z;
			
 
				+
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    if ( $403E <= aExp ) begin
			
 
				+        if ( ( aExp = $7FFF ) and (bits64) ( extractFloatx80Frac( a ) shl 1 ) ) begin
			
 
				+            result := propagateFloatx80NaN( a, a );
			
 
				+        end;
			
 
				+        result := a;
			
 
				+    end;
			
 
				+    if ( aExp < $3FFF ) begin
			
 
				+        if (    ( aExp = 0 )
			
 
				+             and ( (bits64) ( extractFloatx80Frac( a ) shl 1 ) = 0 ) ) begin
			
 
				+            result := a;
			
 
				+        end;
			
 
				+        float_exception_flags or= float_flag_inexact;
			
 
				+        aSign := extractFloatx80Sign( a );
			
 
				+        switch ( float_rounding_mode ) begin
			
 
				+         case float_round_nearest_even:
			
 
				+            if ( ( aExp = $3FFE ) and (bits64) ( extractFloatx80Frac( a ) shl 1 )
			
 
				+               ) begin
			
 
				+                result :=
			
 
				+                    packFloatx80( aSign, $3FFF, LIT64( $8000000000000000 ) );
			
 
				+            end;
			
 
				+            break;
			
 
				+         case float_round_down:
			
 
				+            result :=
			
 
				+                  aSign ?
			
 
				+                      packFloatx80( 1, $3FFF, LIT64( $8000000000000000 ) )
			
 
				+                : packFloatx80( 0, 0, 0 );
			
 
				+         case float_round_up:
			
 
				+            result :=
			
 
				+                  aSign ? packFloatx80( 1, 0, 0 )
			
 
				+                : packFloatx80( 0, $3FFF, LIT64( $8000000000000000 ) );
			
 
				+        end;
			
 
				+        result := packFloatx80( aSign, 0, 0 );
			
 
				+    end;
			
 
				+    lastBitMask := 1;
			
 
				+    lastBitMask  shl = $403E - aExp;
			
 
				+    roundBitsMask := lastBitMask - 1;
			
 
				+    z := a;
			
 
				+    roundingMode := float_rounding_mode;
			
 
				+    if ( roundingMode = float_round_nearest_even ) begin
			
 
				+        z.low += lastBitMask>>1;
			
 
				+        if ( ( z.low and roundBitsMask ) = 0 ) z.low &= ~ lastBitMask;
			
 
				+    end;
			
 
				+    else if ( roundingMode <> float_round_to_zero ) begin
			
 
				+        if ( extractFloatx80Sign( z ) xor ( roundingMode = float_round_up ) ) begin
			
 
				+            z.low += roundBitsMask;
			
 
				+        end;
			
 
				+    end;
			
 
				+    z.low &= ~ roundBitsMask;
			
 
				+    if ( z.low = 0 ) begin
			
 
				+        ++z.high;
			
 
				+        z.low := LIT64( $8000000000000000 );
			
 
				+    end;
			
 
				+    if ( z.low <> a.low ) float_exception_flags or= float_flag_inexact;
			
 
				+    result := z;
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of adding the absolute values of the extended double-
			
 
				+| precision floating-point values `a' and `b'.  If `zSign' is 1, the sum is
			
 
				+| negated before being returned.  `zSign' is ignored if the result is a NaN.
			
 
				+| The addition is performed according to the IEC/IEEE Standard for Binary
			
 
				+| Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function addFloatx80Sigs(a: floatx80; b: floatx80, flag zSign ): floatx80;
			
 
				+begin
			
 
				+    int32 aExp, bExp, zExp;
			
 
				+    bits64 aSig, bSig, zSig0, zSig1;
			
 
				+    int32 expDiff;
			
 
				+
			
 
				+    aSig := extractFloatx80Frac( a );
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    bSig := extractFloatx80Frac( b );
			
 
				+    bExp := extractFloatx80Exp( b );
			
 
				+    expDiff := aExp - bExp;
			
 
				+    if ( 0 < expDiff ) begin
			
 
				+        if ( aExp = $7FFF ) begin
			
 
				+            if ( (bits64) ( aSig shl 1 ) ) result := propagateFloatx80NaN( a, b );
			
 
				+            result := a;
			
 
				+        end;
			
 
				+        if ( bExp = 0 ) --expDiff;
			
 
				+        shift64ExtraRightJamming( bSig, 0, expDiff, &bSig, &zSig1 );
			
 
				+        zExp := aExp;
			
 
				+    end;
			
 
				+    else if ( expDiff < 0 ) begin
			
 
				+        if ( bExp = $7FFF ) begin
			
 
				+            if ( (bits64) ( bSig shl 1 ) ) result := propagateFloatx80NaN( a, b );
			
 
				+            result := packFloatx80( zSign, $7FFF, LIT64( $8000000000000000 ) );
			
 
				+        end;
			
 
				+        if ( aExp = 0 ) ++expDiff;
			
 
				+        shift64ExtraRightJamming( aSig, 0, - expDiff, &aSig, &zSig1 );
			
 
				+        zExp := bExp;
			
 
				+    end;
			
 
				+    else begin
			
 
				+        if ( aExp = $7FFF ) begin
			
 
				+            if ( (bits64) ( ( aSig or bSig ) shl 1 ) ) begin
			
 
				+                result := propagateFloatx80NaN( a, b );
			
 
				+            end;
			
 
				+            result := a;
			
 
				+        end;
			
 
				+        zSig1 := 0;
			
 
				+        zSig0 := aSig + bSig;
			
 
				+        if ( aExp = 0 ) begin
			
 
				+            normalizeFloatx80Subnormal( zSig0, &zExp, &zSig0 );
			
 
				+            goto roundAndPack;
			
 
				+        end;
			
 
				+        zExp := aExp;
			
 
				+        goto shiftRight1;
			
 
				+    end;
			
 
				+    zSig0 := aSig + bSig;
			
 
				+    if ( (sbits64) zSig0 < 0 ) goto roundAndPack;
			
 
				+ shiftRight1:
			
 
				+    shift64ExtraRightJamming( zSig0, zSig1, 1, &zSig0, &zSig1 );
			
 
				+    zSig0 or= LIT64( $8000000000000000 );
			
 
				+    ++zExp;
			
 
				+ roundAndPack:
			
 
				+    result :=
			
 
				+        roundAndPackFloatx80(
			
 
				+            floatx80_rounding_precision, zSign, zExp, zSig0, zSig1 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of subtracting the absolute values of the extended
			
 
				+| double-precision floating-point values `a' and `b'.  If `zSign' is 1, the
			
 
				+| difference is negated before being returned.  `zSign' is ignored if the
			
 
				+| result is a NaN.  The subtraction is performed according to the IEC/IEEE
			
 
				+| Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function subFloatx80Sigs(a: floatx80; b: floatx80, flag zSign ): floatx80;
			
 
				+begin
			
 
				+    int32 aExp, bExp, zExp;
			
 
				+    bits64 aSig, bSig, zSig0, zSig1;
			
 
				+    int32 expDiff;
			
 
				+    floatx80 z;
			
 
				+
			
 
				+    aSig := extractFloatx80Frac( a );
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    bSig := extractFloatx80Frac( b );
			
 
				+    bExp := extractFloatx80Exp( b );
			
 
				+    expDiff := aExp - bExp;
			
 
				+    if ( 0 < expDiff ) goto aExpBigger;
			
 
				+    if ( expDiff < 0 ) goto bExpBigger;
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if ( (bits64) ( ( aSig or bSig ) shl 1 ) ) begin
			
 
				+            result := propagateFloatx80NaN( a, b );
			
 
				+        end;
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        z.low := floatx80_default_nan_low;
			
 
				+        z.high := floatx80_default_nan_high;
			
 
				+        result := z;
			
 
				+    end;
			
 
				+    if ( aExp = 0 ) begin
			
 
				+        aExp := 1;
			
 
				+        bExp := 1;
			
 
				+    end;
			
 
				+    zSig1 := 0;
			
 
				+    if ( bSig < aSig ) goto aBigger;
			
 
				+    if ( aSig < bSig ) goto bBigger;
			
 
				+    result := packFloatx80( float_rounding_mode = float_round_down, 0, 0 );
			
 
				+ bExpBigger:
			
 
				+    if ( bExp = $7FFF ) begin
			
 
				+        if ( (bits64) ( bSig shl 1 ) ) result := propagateFloatx80NaN( a, b );
			
 
				+        result := packFloatx80( zSign xor 1, $7FFF, LIT64( $8000000000000000 ) );
			
 
				+    end;
			
 
				+    if ( aExp = 0 ) ++expDiff;
			
 
				+    shift128RightJamming( aSig, 0, - expDiff, &aSig, &zSig1 );
			
 
				+ bBigger:
			
 
				+    sub128( bSig, 0, aSig, zSig1, &zSig0, &zSig1 );
			
 
				+    zExp := bExp;
			
 
				+    zSign  xor = 1;
			
 
				+    goto normalizeRoundAndPack;
			
 
				+ aExpBigger:
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if ( (bits64) ( aSig shl 1 ) ) result := propagateFloatx80NaN( a, b );
			
 
				+        result := a;
			
 
				+    end;
			
 
				+    if ( bExp = 0 ) --expDiff;
			
 
				+    shift128RightJamming( bSig, 0, expDiff, &bSig, &zSig1 );
			
 
				+ aBigger:
			
 
				+    sub128( aSig, 0, bSig, zSig1, &zSig0, &zSig1 );
			
 
				+    zExp := aExp;
			
 
				+ normalizeRoundAndPack:
			
 
				+    result :=
			
 
				+        normalizeRoundAndPackFloatx80(
			
 
				+            floatx80_rounding_precision, zSign, zExp, zSig0, zSig1 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of adding the extended double-precision floating-point
			
 
				+| values `a' and `b'.  The operation is performed according to the IEC/IEEE
			
 
				+| Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_add(a: floatx80; b: floatx80): floatx80;
			
 
				+begin
			
 
				+    flag aSign, bSign;
			
 
				+
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    bSign := extractFloatx80Sign( b );
			
 
				+    if ( aSign = bSign ) begin
			
 
				+        result := addFloatx80Sigs( a, b, aSign );
			
 
				+    end;
			
 
				+    else begin
			
 
				+        result := subFloatx80Sigs( a, b, aSign );
			
 
				+    end;
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of subtracting the extended double-precision floating-
			
 
				+| point values `a' and `b'.  The operation is performed according to the
			
 
				+| IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_sub(a: floatx80; b: floatx80 ): floatx80;
			
 
				+begin
			
 
				+    flag aSign, bSign;
			
 
				+
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    bSign := extractFloatx80Sign( b );
			
 
				+    if ( aSign = bSign ) begin
			
 
				+        result := subFloatx80Sigs( a, b, aSign );
			
 
				+    end;
			
 
				+    else begin
			
 
				+        result := addFloatx80Sigs( a, b, aSign );
			
 
				+    end;
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of multiplying the extended double-precision floating-
			
 
				+| point values `a' and `b'.  The operation is performed according to the
			
 
				+| IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_mul(a: floatx80; b: floatx80): floatx80;
			
 
				+begin
			
 
				+    flag aSign, bSign, zSign;
			
 
				+    int32 aExp, bExp, zExp;
			
 
				+    bits64 aSig, bSig, zSig0, zSig1;
			
 
				+    floatx80 z;
			
 
				+
			
 
				+    aSig := extractFloatx80Frac( a );
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    bSig := extractFloatx80Frac( b );
			
 
				+    bExp := extractFloatx80Exp( b );
			
 
				+    bSign := extractFloatx80Sign( b );
			
 
				+    zSign := aSign xor bSign;
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if (    (bits64) ( aSig shl 1 )
			
 
				+             or ( ( bExp = $7FFF ) and (bits64) ( bSig shl 1 ) ) ) begin
			
 
				+            result := propagateFloatx80NaN( a, b );
			
 
				+        end;
			
 
				+        if ( ( bExp or bSig ) = 0 ) goto invalid;
			
 
				+        result := packFloatx80( zSign, $7FFF, LIT64( $8000000000000000 ) );
			
 
				+    end;
			
 
				+    if ( bExp = $7FFF ) begin
			
 
				+        if ( (bits64) ( bSig shl 1 ) ) result := propagateFloatx80NaN( a, b );
			
 
				+        if ( ( aExp or aSig ) = 0 ) begin
			
 
				+ invalid:
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            z.low := floatx80_default_nan_low;
			
 
				+            z.high := floatx80_default_nan_high;
			
 
				+            result := z;
			
 
				+        end;
			
 
				+        result := packFloatx80( zSign, $7FFF, LIT64( $8000000000000000 ) );
			
 
				+    end;
			
 
				+    if ( aExp = 0 ) begin
			
 
				+        if ( aSig = 0 ) result := packFloatx80( zSign, 0, 0 );
			
 
				+        normalizeFloatx80Subnormal( aSig, &aExp, &aSig );
			
 
				+    end;
			
 
				+    if ( bExp = 0 ) begin
			
 
				+        if ( bSig = 0 ) result := packFloatx80( zSign, 0, 0 );
			
 
				+        normalizeFloatx80Subnormal( bSig, &bExp, &bSig );
			
 
				+    end;
			
 
				+    zExp := aExp + bExp - $3FFE;
			
 
				+    mul64To128( aSig, bSig, &zSig0, &zSig1 );
			
 
				+    if ( 0 < (sbits64) zSig0 ) begin
			
 
				+        shortShift128Left( zSig0, zSig1, 1, &zSig0, &zSig1 );
			
 
				+        --zExp;
			
 
				+    end;
			
 
				+    result :=
			
 
				+        roundAndPackFloatx80(
			
 
				+            floatx80_rounding_precision, zSign, zExp, zSig0, zSig1 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of dividing the extended double-precision floating-point
			
 
				+| value `a' by the corresponding value `b'.  The operation is performed
			
 
				+| according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_div(a: floatx80; b: floatx80 ): floatx80;
			
 
				+begin
			
 
				+    flag aSign, bSign, zSign;
			
 
				+    int32 aExp, bExp, zExp;
			
 
				+    bits64 aSig, bSig, zSig0, zSig1;
			
 
				+    bits64 rem0, rem1, rem2, term0, term1, term2;
			
 
				+    floatx80 z;
			
 
				+
			
 
				+    aSig := extractFloatx80Frac( a );
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    bSig := extractFloatx80Frac( b );
			
 
				+    bExp := extractFloatx80Exp( b );
			
 
				+    bSign := extractFloatx80Sign( b );
			
 
				+    zSign := aSign xor bSign;
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if ( (bits64) ( aSig shl 1 ) ) result := propagateFloatx80NaN( a, b );
			
 
				+        if ( bExp = $7FFF ) begin
			
 
				+            if ( (bits64) ( bSig shl 1 ) ) result := propagateFloatx80NaN( a, b );
			
 
				+            goto invalid;
			
 
				+        end;
			
 
				+        result := packFloatx80( zSign, $7FFF, LIT64( $8000000000000000 ) );
			
 
				+    end;
			
 
				+    if ( bExp = $7FFF ) begin
			
 
				+        if ( (bits64) ( bSig shl 1 ) ) result := propagateFloatx80NaN( a, b );
			
 
				+        result := packFloatx80( zSign, 0, 0 );
			
 
				+    end;
			
 
				+    if ( bExp = 0 ) begin
			
 
				+        if ( bSig = 0 ) begin
			
 
				+            if ( ( aExp or aSig ) = 0 ) begin
			
 
				+ invalid:
			
 
				+                float_raise( float_flag_invalid );
			
 
				+                z.low := floatx80_default_nan_low;
			
 
				+                z.high := floatx80_default_nan_high;
			
 
				+                result := z;
			
 
				+            end;
			
 
				+            float_raise( float_flag_divbyzero );
			
 
				+            result := packFloatx80( zSign, $7FFF, LIT64( $8000000000000000 ) );
			
 
				+        end;
			
 
				+        normalizeFloatx80Subnormal( bSig, &bExp, &bSig );
			
 
				+    end;
			
 
				+    if ( aExp = 0 ) begin
			
 
				+        if ( aSig = 0 ) result := packFloatx80( zSign, 0, 0 );
			
 
				+        normalizeFloatx80Subnormal( aSig, &aExp, &aSig );
			
 
				+    end;
			
 
				+    zExp := aExp - bExp + $3FFE;
			
 
				+    rem1 := 0;
			
 
				+    if ( bSig <= aSig ) begin
			
 
				+        shift128Right( aSig, 0, 1, &aSig, &rem1 );
			
 
				+        ++zExp;
			
 
				+    end;
			
 
				+    zSig0 := estimateDiv128To64( aSig, rem1, bSig );
			
 
				+    mul64To128( bSig, zSig0, &term0, &term1 );
			
 
				+    sub128( aSig, rem1, term0, term1, &rem0, &rem1 );
			
 
				+    while ( (sbits64) rem0 < 0 ) begin
			
 
				+        --zSig0;
			
 
				+        add128( rem0, rem1, 0, bSig, &rem0, &rem1 );
			
 
				+    end;
			
 
				+    zSig1 := estimateDiv128To64( rem1, 0, bSig );
			
 
				+    if ( (bits64) ( zSig1 shl 1 ) <= 8 ) begin
			
 
				+        mul64To128( bSig, zSig1, &term1, &term2 );
			
 
				+        sub128( rem1, 0, term1, term2, &rem1, &rem2 );
			
 
				+        while ( (sbits64) rem1 < 0 ) begin
			
 
				+            --zSig1;
			
 
				+            add128( rem1, rem2, 0, bSig, &rem1, &rem2 );
			
 
				+        end;
			
 
				+        zSig1 or= ( ( rem1 or rem2 ) <> 0 );
			
 
				+    end;
			
 
				+    result :=
			
 
				+        roundAndPackFloatx80(
			
 
				+            floatx80_rounding_precision, zSign, zExp, zSig0, zSig1 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the remainder of the extended double-precision floating-point value
			
 
				+| `a' with respect to the corresponding value `b'.  The operation is performed
			
 
				+| according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_rem(a: floatx80; b: floatx80 ): floatx80;
			
 
				+begin
			
 
				+    flag aSign, bSign, zSign;
			
 
				+    int32 aExp, bExp, expDiff;
			
 
				+    bits64 aSig0, aSig1, bSig;
			
 
				+    bits64 q, term0, term1, alternateASig0, alternateASig1;
			
 
				+    floatx80 z;
			
 
				+
			
 
				+    aSig0 := extractFloatx80Frac( a );
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    bSig := extractFloatx80Frac( b );
			
 
				+    bExp := extractFloatx80Exp( b );
			
 
				+    bSign := extractFloatx80Sign( b );
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if (    (bits64) ( aSig0 shl 1 )
			
 
				+             or ( ( bExp = $7FFF ) and (bits64) ( bSig shl 1 ) ) ) begin
			
 
				+            result := propagateFloatx80NaN( a, b );
			
 
				+        end;
			
 
				+        goto invalid;
			
 
				+    end;
			
 
				+    if ( bExp = $7FFF ) begin
			
 
				+        if ( (bits64) ( bSig shl 1 ) ) result := propagateFloatx80NaN( a, b );
			
 
				+        result := a;
			
 
				+    end;
			
 
				+    if ( bExp = 0 ) begin
			
 
				+        if ( bSig = 0 ) begin
			
 
				+ invalid:
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            z.low := floatx80_default_nan_low;
			
 
				+            z.high := floatx80_default_nan_high;
			
 
				+            result := z;
			
 
				+        end;
			
 
				+        normalizeFloatx80Subnormal( bSig, &bExp, &bSig );
			
 
				+    end;
			
 
				+    if ( aExp = 0 ) begin
			
 
				+        if ( (bits64) ( aSig0 shl 1 ) = 0 ) result := a;
			
 
				+        normalizeFloatx80Subnormal( aSig0, &aExp, &aSig0 );
			
 
				+    end;
			
 
				+    bSig or= LIT64( $8000000000000000 );
			
 
				+    zSign := aSign;
			
 
				+    expDiff := aExp - bExp;
			
 
				+    aSig1 := 0;
			
 
				+    if ( expDiff < 0 ) begin
			
 
				+        if ( expDiff < -1 ) result := a;
			
 
				+        shift128Right( aSig0, 0, 1, &aSig0, &aSig1 );
			
 
				+        expDiff := 0;
			
 
				+    end;
			
 
				+    q := ( bSig <= aSig0 );
			
 
				+    if ( q ) aSig0 -= bSig;
			
 
				+    expDiff -= 64;
			
 
				+    while ( 0 < expDiff ) begin
			
 
				+        q := estimateDiv128To64( aSig0, aSig1, bSig );
			
 
				+        q := ( 2 < q ) ? q - 2 : 0;
			
 
				+        mul64To128( bSig, q, &term0, &term1 );
			
 
				+        sub128( aSig0, aSig1, term0, term1, &aSig0, &aSig1 );
			
 
				+        shortShift128Left( aSig0, aSig1, 62, &aSig0, &aSig1 );
			
 
				+        expDiff -= 62;
			
 
				+    end;
			
 
				+    expDiff += 64;
			
 
				+    if ( 0 < expDiff ) begin
			
 
				+        q := estimateDiv128To64( aSig0, aSig1, bSig );
			
 
				+        q := ( 2 < q ) ? q - 2 : 0;
			
 
				+        q >>= 64 - expDiff;
			
 
				+        mul64To128( bSig, q shl ( 64 - expDiff ), &term0, &term1 );
			
 
				+        sub128( aSig0, aSig1, term0, term1, &aSig0, &aSig1 );
			
 
				+        shortShift128Left( 0, bSig, 64 - expDiff, &term0, &term1 );
			
 
				+        while ( le128( term0, term1, aSig0, aSig1 ) ) begin
			
 
				+            ++q;
			
 
				+            sub128( aSig0, aSig1, term0, term1, &aSig0, &aSig1 );
			
 
				+        end;
			
 
				+    end;
			
 
				+    else begin
			
 
				+        term1 := 0;
			
 
				+        term0 := bSig;
			
 
				+    end;
			
 
				+    sub128( term0, term1, aSig0, aSig1, &alternateASig0, &alternateASig1 );
			
 
				+    if (    lt128( alternateASig0, alternateASig1, aSig0, aSig1 )
			
 
				+         or (    eq128( alternateASig0, alternateASig1, aSig0, aSig1 )
			
 
				+              and ( q and 1 ) )
			
 
				+       ) begin
			
 
				+        aSig0 := alternateASig0;
			
 
				+        aSig1 := alternateASig1;
			
 
				+        zSign := ! zSign;
			
 
				+    end;
			
 
				+    result :=
			
 
				+        normalizeRoundAndPackFloatx80(
			
 
				+            80, zSign, bExp + expDiff, aSig0, aSig1 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the square root of the extended double-precision floating-point
			
 
				+| value `a'.  The operation is performed according to the IEC/IEEE Standard
			
 
				+| for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_sqrt(a: floatx80): floatx80;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp, zExp;
			
 
				+    bits64 aSig0, aSig1, zSig0, zSig1, doubleZSig0;
			
 
				+    bits64 rem0, rem1, rem2, rem3, term0, term1, term2, term3;
			
 
				+    floatx80 z;
			
 
				+
			
 
				+    aSig0 := extractFloatx80Frac( a );
			
 
				+    aExp := extractFloatx80Exp( a );
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if ( (bits64) ( aSig0 shl 1 ) ) result := propagateFloatx80NaN( a, a );
			
 
				+        if ( ! aSign ) result := a;
			
 
				+        goto invalid;
			
 
				+    end;
			
 
				+    if ( aSign ) begin
			
 
				+        if ( ( aExp or aSig0 ) = 0 ) result := a;
			
 
				+ invalid:
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        z.low := floatx80_default_nan_low;
			
 
				+        z.high := floatx80_default_nan_high;
			
 
				+        result := z;
			
 
				+    end;
			
 
				+    if ( aExp = 0 ) begin
			
 
				+        if ( aSig0 = 0 ) result := packFloatx80( 0, 0, 0 );
			
 
				+        normalizeFloatx80Subnormal( aSig0, &aExp, &aSig0 );
			
 
				+    end;
			
 
				+    zExp := ( ( aExp - $3FFF )>>1 ) + $3FFF;
			
 
				+    zSig0 := estimateSqrt32( aExp, aSig0>>32 );
			
 
				+    shift128Right( aSig0, 0, 2 + ( aExp and 1 ), &aSig0, &aSig1 );
			
 
				+    zSig0 := estimateDiv128To64( aSig0, aSig1, zSig0 shl 32 ) + ( zSig0 shl 30 );
			
 
				+    doubleZSig0 := zSig0 shl 1;
			
 
				+    mul64To128( zSig0, zSig0, &term0, &term1 );
			
 
				+    sub128( aSig0, aSig1, term0, term1, &rem0, &rem1 );
			
 
				+    while ( (sbits64) rem0 < 0 ) begin
			
 
				+        --zSig0;
			
 
				+        doubleZSig0 -= 2;
			
 
				+        add128( rem0, rem1, zSig0>>63, doubleZSig0 or 1, &rem0, &rem1 );
			
 
				+    end;
			
 
				+    zSig1 := estimateDiv128To64( rem1, 0, doubleZSig0 );
			
 
				+    if ( ( zSig1 and LIT64( $3FFFFFFFFFFFFFFF ) ) <= 5 ) begin
			
 
				+        if ( zSig1 = 0 ) zSig1 := 1;
			
 
				+        mul64To128( doubleZSig0, zSig1, &term1, &term2 );
			
 
				+        sub128( rem1, 0, term1, term2, &rem1, &rem2 );
			
 
				+        mul64To128( zSig1, zSig1, &term2, &term3 );
			
 
				+        sub192( rem1, rem2, 0, 0, term2, term3, &rem1, &rem2, &rem3 );
			
 
				+        while ( (sbits64) rem1 < 0 ) begin
			
 
				+            --zSig1;
			
 
				+            shortShift128Left( 0, zSig1, 1, &term2, &term3 );
			
 
				+            term3 or= 1;
			
 
				+            term2 or= doubleZSig0;
			
 
				+            add192( rem1, rem2, rem3, 0, term2, term3, &rem1, &rem2, &rem3 );
			
 
				+        end;
			
 
				+        zSig1 or= ( ( rem1 or rem2 or rem3 ) <> 0 );
			
 
				+    end;
			
 
				+    shortShift128Left( 0, zSig1, 1, &zSig0, &zSig1 );
			
 
				+    zSig0 or= doubleZSig0;
			
 
				+    result :=
			
 
				+        roundAndPackFloatx80(
			
 
				+            floatx80_rounding_precision, 0, zExp, zSig0, zSig1 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the extended double-precision floating-point value `a' is
			
 
				+| equal to the corresponding value `b', and 0 otherwise.  The comparison is
			
 
				+| performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+| Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_eq(a: floatx80; b: floatx80 ): flag;
			
 
				+begin
			
 
				+
			
 
				+    if (    (    ( extractFloatx80Exp( a ) = $7FFF )
			
 
				+              and (bits64) ( extractFloatx80Frac( a ) shl 1 ) )
			
 
				+         or (    ( extractFloatx80Exp( b ) = $7FFF )
			
 
				+              and (bits64) ( extractFloatx80Frac( b ) shl 1 ) )
			
 
				+       ) begin
			
 
				+        if (    floatx80_is_signaling_nan( a )
			
 
				+             or floatx80_is_signaling_nan( b ) ) begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+        end;
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    result :=
			
 
				+           ( a.low = b.low )
			
 
				+        and (    ( a.high = b.high )
			
 
				+             or (    ( a.low = 0 )
			
 
				+                  and ( (bits16) ( ( a.high or b.high ) shl 1 ) = 0 ) )
			
 
				+           );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the extended double-precision floating-point value `a' is
			
 
				+| less than or equal to the corresponding value `b', and 0 otherwise.  The
			
 
				+| comparison is performed according to the IEC/IEEE Standard for Binary
			
 
				+| Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_le(a: floatx80; b: floatx80 ): flag;
			
 
				+begin
			
 
				+    flag aSign, bSign;
			
 
				+
			
 
				+    if (    (    ( extractFloatx80Exp( a ) = $7FFF )
			
 
				+              and (bits64) ( extractFloatx80Frac( a ) shl 1 ) )
			
 
				+         or (    ( extractFloatx80Exp( b ) = $7FFF )
			
 
				+              and (bits64) ( extractFloatx80Frac( b ) shl 1 ) )
			
 
				+       ) begin
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    bSign := extractFloatx80Sign( b );
			
 
				+    if ( aSign <> bSign ) begin
			
 
				+        result :=
			
 
				+               aSign
			
 
				+            or (    ( ( (bits16) ( ( a.high or b.high ) shl 1 ) ) or a.low or b.low )
			
 
				+                 = 0 );
			
 
				+    end;
			
 
				+    result :=
			
 
				+          aSign ? le128( b.high, b.low, a.high, a.low )
			
 
				+        : le128( a.high, a.low, b.high, b.low );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the extended double-precision floating-point value `a' is
			
 
				+| less than the corresponding value `b', and 0 otherwise.  The comparison
			
 
				+| is performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+| Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_lt(a: floatx80; b: floatx80 ): flag;
			
 
				+begin
			
 
				+    flag aSign, bSign;
			
 
				+
			
 
				+    if (    (    ( extractFloatx80Exp( a ) = $7FFF )
			
 
				+              and (bits64) ( extractFloatx80Frac( a ) shl 1 ) )
			
 
				+         or (    ( extractFloatx80Exp( b ) = $7FFF )
			
 
				+              and (bits64) ( extractFloatx80Frac( b ) shl 1 ) )
			
 
				+       ) begin
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    bSign := extractFloatx80Sign( b );
			
 
				+    if ( aSign <> bSign ) begin
			
 
				+        result :=
			
 
				+               aSign
			
 
				+            and (    ( ( (bits16) ( ( a.high or b.high ) shl 1 ) ) or a.low or b.low )
			
 
				+                 <> 0 );
			
 
				+    end;
			
 
				+    result :=
			
 
				+          aSign ? lt128( b.high, b.low, a.high, a.low )
			
 
				+        : lt128( a.high, a.low, b.high, b.low );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the extended double-precision floating-point value `a' is equal
			
 
				+| to the corresponding value `b', and 0 otherwise.  The invalid exception is
			
 
				+| raised if either operand is a NaN.  Otherwise, the comparison is performed
			
 
				+| according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_eq_signaling(a: floatx80; b: floatx80 ): flag;
			
 
				+begin
			
 
				+
			
 
				+    if (    (    ( extractFloatx80Exp( a ) = $7FFF )
			
 
				+              and (bits64) ( extractFloatx80Frac( a ) shl 1 ) )
			
 
				+         or (    ( extractFloatx80Exp( b ) = $7FFF )
			
 
				+              and (bits64) ( extractFloatx80Frac( b ) shl 1 ) )
			
 
				+       ) begin
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    result :=
			
 
				+           ( a.low = b.low )
			
 
				+        and (    ( a.high = b.high )
			
 
				+             or (    ( a.low = 0 )
			
 
				+                  and ( (bits16) ( ( a.high or b.high ) shl 1 ) = 0 ) )
			
 
				+           );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the extended double-precision floating-point value `a' is less
			
 
				+| than or equal to the corresponding value `b', and 0 otherwise.  Quiet NaNs
			
 
				+| do not cause an exception.  Otherwise, the comparison is performed according
			
 
				+| to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_le_quiet(a: floatx80; b: floatx80 ): flag;
			
 
				+begin
			
 
				+    flag aSign, bSign;
			
 
				+
			
 
				+    if (    (    ( extractFloatx80Exp( a ) = $7FFF )
			
 
				+              and (bits64) ( extractFloatx80Frac( a ) shl 1 ) )
			
 
				+         or (    ( extractFloatx80Exp( b ) = $7FFF )
			
 
				+              and (bits64) ( extractFloatx80Frac( b ) shl 1 ) )
			
 
				+       ) begin
			
 
				+        if (    floatx80_is_signaling_nan( a )
			
 
				+             or floatx80_is_signaling_nan( b ) ) begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+        end;
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    bSign := extractFloatx80Sign( b );
			
 
				+    if ( aSign <> bSign ) begin
			
 
				+        result :=
			
 
				+               aSign
			
 
				+            or (    ( ( (bits16) ( ( a.high or b.high ) shl 1 ) ) or a.low or b.low )
			
 
				+                 = 0 );
			
 
				+    end;
			
 
				+    result :=
			
 
				+          aSign ? le128( b.high, b.low, a.high, a.low )
			
 
				+        : le128( a.high, a.low, b.high, b.low );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the extended double-precision floating-point value `a' is less
			
 
				+| than the corresponding value `b', and 0 otherwise.  Quiet NaNs do not cause
			
 
				+| an exception.  Otherwise, the comparison is performed according to the
			
 
				+| IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function floatx80_lt_quiet(a: floatx80; b: floatx80 ): flag;
			
 
				+begin
			
 
				+    flag aSign, bSign;
			
 
				+
			
 
				+    if (    (    ( extractFloatx80Exp( a ) = $7FFF )
			
 
				+              and (bits64) ( extractFloatx80Frac( a ) shl 1 ) )
			
 
				+         or (    ( extractFloatx80Exp( b ) = $7FFF )
			
 
				+              and (bits64) ( extractFloatx80Frac( b ) shl 1 ) )
			
 
				+       ) begin
			
 
				+        if (    floatx80_is_signaling_nan( a )
			
 
				+             or floatx80_is_signaling_nan( b ) ) begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+        end;
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    aSign := extractFloatx80Sign( a );
			
 
				+    bSign := extractFloatx80Sign( b );
			
 
				+    if ( aSign <> bSign ) begin
			
 
				+        result :=
			
 
				+               aSign
			
 
				+            and (    ( ( (bits16) ( ( a.high or b.high ) shl 1 ) ) or a.low or b.low )
			
 
				+                 <> 0 );
			
 
				+    end;
			
 
				+    result :=
			
 
				+          aSign ? lt128( b.high, b.low, a.high, a.low )
			
 
				+        : lt128( a.high, a.low, b.high, b.low );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{$endif FPC_SOFTFLOAT_FLOATX80}
			
 
				+
			
 
				+
			
 
				+{$ifdef FPC_SOFTFLOAT_FLOAT128}
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the quadruple-precision floating-point
			
 
				+| value `a' to the 32-bit two's complement integer format.  The conversion
			
 
				+| is performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+| Arithmetic---which means in particular that the conversion is rounded
			
 
				+| according to the current rounding mode.  If `a' is a NaN, the largest
			
 
				+| positive integer is returned.  Otherwise, if the conversion overflows, the
			
 
				+| largest integer with the same sign as `a' is returned.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_to_int32(a: float128): int32;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp, shiftCount;
			
 
				+    bits64 aSig0, aSig1;
			
 
				+
			
 
				+    aSig1 := extractFloat128Frac1( a );
			
 
				+    aSig0 := extractFloat128Frac0( a );
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    if ( ( aExp = $7FFF ) and ( aSig0 or aSig1 ) ) aSign := 0;
			
 
				+    if ( aExp ) aSig0 or= LIT64( $0001000000000000 );
			
 
				+    aSig0 or= ( aSig1 <> 0 );
			
 
				+    shiftCount := $4028 - aExp;
			
 
				+    if ( 0 < shiftCount ) shift64RightJamming( aSig0, shiftCount, &aSig0 );
			
 
				+    result := roundAndPackInt32( aSign, aSig0 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the quadruple-precision floating-point
			
 
				+| value `a' to the 32-bit two's complement integer format.  The conversion
			
 
				+| is performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+| Arithmetic, except that the conversion is always rounded toward zero.  If
			
 
				+| `a' is a NaN, the largest positive integer is returned.  Otherwise, if the
			
 
				+| conversion overflows, the largest integer with the same sign as `a' is
			
 
				+| returned.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_to_int32_round_to_zero(a: float128): int32;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp, shiftCount;
			
 
				+    bits64 aSig0, aSig1, savedASig;
			
 
				+    int32 z;
			
 
				+
			
 
				+    aSig1 := extractFloat128Frac1( a );
			
 
				+    aSig0 := extractFloat128Frac0( a );
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    aSig0 or= ( aSig1 <> 0 );
			
 
				+    if ( $401E < aExp ) begin
			
 
				+        if ( ( aExp = $7FFF ) and aSig0 ) aSign := 0;
			
 
				+        goto invalid;
			
 
				+    end;
			
 
				+    else if ( aExp < $3FFF ) begin
			
 
				+        if ( aExp or aSig0 ) float_exception_flags or= float_flag_inexact;
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    aSig0 or= LIT64( $0001000000000000 );
			
 
				+    shiftCount := $402F - aExp;
			
 
				+    savedASig := aSig0;
			
 
				+    aSig0 >>= shiftCount;
			
 
				+    z := aSig0;
			
 
				+    if ( aSign ) z := - z;
			
 
				+    if ( ( z < 0 ) xor aSign ) begin
			
 
				+ invalid:
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        result := aSign ? (sbits32) $80000000 : $7FFFFFFF;
			
 
				+    end;
			
 
				+    if ( ( aSig0 shl shiftCount ) <> savedASig ) begin
			
 
				+        float_exception_flags or= float_flag_inexact;
			
 
				+    end;
			
 
				+    result := z;
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the quadruple-precision floating-point
			
 
				+| value `a' to the 64-bit two's complement integer format.  The conversion
			
 
				+| is performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+| Arithmetic---which means in particular that the conversion is rounded
			
 
				+| according to the current rounding mode.  If `a' is a NaN, the largest
			
 
				+| positive integer is returned.  Otherwise, if the conversion overflows, the
			
 
				+| largest integer with the same sign as `a' is returned.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_to_int64(a: float128): int64;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp, shiftCount;
			
 
				+    bits64 aSig0, aSig1;
			
 
				+
			
 
				+    aSig1 := extractFloat128Frac1( a );
			
 
				+    aSig0 := extractFloat128Frac0( a );
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    if ( aExp ) aSig0 or= LIT64( $0001000000000000 );
			
 
				+    shiftCount := $402F - aExp;
			
 
				+    if ( shiftCount <= 0 ) begin
			
 
				+        if ( $403E < aExp ) begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            if (    ! aSign
			
 
				+                 or (    ( aExp = $7FFF )
			
 
				+                      and ( aSig1 or ( aSig0 <> LIT64( $0001000000000000 ) ) )
			
 
				+                    )
			
 
				+               ) begin
			
 
				+                result := LIT64( $7FFFFFFFFFFFFFFF );
			
 
				+            end;
			
 
				+            result := (sbits64) LIT64( $8000000000000000 );
			
 
				+        end;
			
 
				+        shortShift128Left( aSig0, aSig1, - shiftCount, &aSig0, &aSig1 );
			
 
				+    end;
			
 
				+    else begin
			
 
				+        shift64ExtraRightJamming( aSig0, aSig1, shiftCount, &aSig0, &aSig1 );
			
 
				+    end;
			
 
				+    result := roundAndPackInt64( aSign, aSig0, aSig1 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the quadruple-precision floating-point
			
 
				+| value `a' to the 64-bit two's complement integer format.  The conversion
			
 
				+| is performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+| Arithmetic, except that the conversion is always rounded toward zero.
			
 
				+| If `a' is a NaN, the largest positive integer is returned.  Otherwise, if
			
 
				+| the conversion overflows, the largest integer with the same sign as `a' is
			
 
				+| returned.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_to_int64_round_to_zero(a: float128): int64;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp, shiftCount;
			
 
				+    bits64 aSig0, aSig1;
			
 
				+    int64 z;
			
 
				+
			
 
				+    aSig1 := extractFloat128Frac1( a );
			
 
				+    aSig0 := extractFloat128Frac0( a );
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    if ( aExp ) aSig0 or= LIT64( $0001000000000000 );
			
 
				+    shiftCount := aExp - $402F;
			
 
				+    if ( 0 < shiftCount ) begin
			
 
				+        if ( $403E <= aExp ) begin
			
 
				+            aSig0 &= LIT64( $0000FFFFFFFFFFFF );
			
 
				+            if (    ( a.high = LIT64( $C03E000000000000 ) )
			
 
				+                 and ( aSig1 < LIT64( $0002000000000000 ) ) ) begin
			
 
				+                if ( aSig1 ) float_exception_flags or= float_flag_inexact;
			
 
				+            end;
			
 
				+            else begin
			
 
				+                float_raise( float_flag_invalid );
			
 
				+                if ( ! aSign or ( ( aExp = $7FFF ) and ( aSig0 or aSig1 ) ) ) begin
			
 
				+                    result := LIT64( $7FFFFFFFFFFFFFFF );
			
 
				+                end;
			
 
				+            end;
			
 
				+            result := (sbits64) LIT64( $8000000000000000 );
			
 
				+        end;
			
 
				+        z := ( aSig0 shl shiftCount ) or ( aSig1>>( ( - shiftCount ) and 63 ) );
			
 
				+        if ( (bits64) ( aSig1 shl shiftCount ) ) begin
			
 
				+            float_exception_flags or= float_flag_inexact;
			
 
				+        end;
			
 
				+    end;
			
 
				+    else begin
			
 
				+        if ( aExp < $3FFF ) begin
			
 
				+            if ( aExp or aSig0 or aSig1 ) begin
			
 
				+                float_exception_flags or= float_flag_inexact;
			
 
				+            end;
			
 
				+            result := 0;
			
 
				+        end;
			
 
				+        z := aSig0>>( - shiftCount );
			
 
				+        if (    aSig1
			
 
				+             or ( shiftCount and (bits64) ( aSig0 shl ( shiftCount and 63 ) ) ) ) begin
			
 
				+            float_exception_flags or= float_flag_inexact;
			
 
				+        end;
			
 
				+    end;
			
 
				+    if ( aSign ) z := - z;
			
 
				+    result := z;
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the quadruple-precision floating-point
			
 
				+| value `a' to the single-precision floating-point format.  The conversion
			
 
				+| is performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+| Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_to_float32(a: float128): float32;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp;
			
 
				+    bits64 aSig0, aSig1;
			
 
				+    bits32 zSig;
			
 
				+
			
 
				+    aSig1 := extractFloat128Frac1( a );
			
 
				+    aSig0 := extractFloat128Frac0( a );
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if ( aSig0 or aSig1 ) begin
			
 
				+            result := commonNaNToFloat32( float128ToCommonNaN( a ) );
			
 
				+        end;
			
 
				+        result := packFloat32( aSign, $FF, 0 );
			
 
				+    end;
			
 
				+    aSig0 or= ( aSig1 <> 0 );
			
 
				+    shift64RightJamming( aSig0, 18, &aSig0 );
			
 
				+    zSig := aSig0;
			
 
				+    if ( aExp or zSig ) begin
			
 
				+        zSig or= $40000000;
			
 
				+        aExp -= $3F81;
			
 
				+    end;
			
 
				+    result := roundAndPackFloat32( aSign, aExp, zSig );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the quadruple-precision floating-point
			
 
				+| value `a' to the double-precision floating-point format.  The conversion
			
 
				+| is performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+| Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_to_float64(a: float128): float64;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp;
			
 
				+    bits64 aSig0, aSig1;
			
 
				+
			
 
				+    aSig1 := extractFloat128Frac1( a );
			
 
				+    aSig0 := extractFloat128Frac0( a );
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if ( aSig0 or aSig1 ) begin
			
 
				+            result := commonNaNToFloat64( float128ToCommonNaN( a ) );
			
 
				+        end;
			
 
				+        result := packFloat64( aSign, $7FF, 0 );
			
 
				+    end;
			
 
				+    shortShift128Left( aSig0, aSig1, 14, &aSig0, &aSig1 );
			
 
				+    aSig0 or= ( aSig1 <> 0 );
			
 
				+    if ( aExp or aSig0 ) begin
			
 
				+        aSig0 or= LIT64( $4000000000000000 );
			
 
				+        aExp -= $3C01;
			
 
				+    end;
			
 
				+    result := roundAndPackFloat64( aSign, aExp, aSig0 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{$ifdef FPC_SOFTFLOAT_FLOATX80}
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the quadruple-precision floating-point
			
 
				+| value `a' to the extended double-precision floating-point format.  The
			
 
				+| conversion is performed according to the IEC/IEEE Standard for Binary
			
 
				+| Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_to_floatx80(a: float128): floatx80;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp;
			
 
				+    bits64 aSig0, aSig1;
			
 
				+
			
 
				+    aSig1 := extractFloat128Frac1( a );
			
 
				+    aSig0 := extractFloat128Frac0( a );
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if ( aSig0 or aSig1 ) begin
			
 
				+            result := commonNaNToFloatx80( float128ToCommonNaN( a ) );
			
 
				+        end;
			
 
				+        result := packFloatx80( aSign, $7FFF, LIT64( $8000000000000000 ) );
			
 
				+    end;
			
 
				+    if ( aExp = 0 ) begin
			
 
				+        if ( ( aSig0 or aSig1 ) = 0 ) result := packFloatx80( aSign, 0, 0 );
			
 
				+        normalizeFloat128Subnormal( aSig0, aSig1, &aExp, &aSig0, &aSig1 );
			
 
				+    end;
			
 
				+    else begin
			
 
				+        aSig0 or= LIT64( $0001000000000000 );
			
 
				+    end;
			
 
				+    shortShift128Left( aSig0, aSig1, 15, &aSig0, &aSig1 );
			
 
				+    result := roundAndPackFloatx80( 80, aSign, aExp, aSig0, aSig1 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{$endif FPC_SOFTFLOAT_FLOATX80}
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Rounds the quadruple-precision floating-point value `a' to an integer, and
			
 
				+| Returns the result as a quadruple-precision floating-point value.  The
			
 
				+| operation is performed according to the IEC/IEEE Standard for Binary
			
 
				+| Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_round_to_int(a: float128): float128;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp;
			
 
				+    bits64 lastBitMask, roundBitsMask;
			
 
				+    int8 roundingMode;
			
 
				+    float128 z;
			
 
				+
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    if ( $402F <= aExp ) begin
			
 
				+        if ( $406F <= aExp ) begin
			
 
				+            if (    ( aExp = $7FFF )
			
 
				+                 and ( extractFloat128Frac0( a ) or extractFloat128Frac1( a ) )
			
 
				+               ) begin
			
 
				+                result := propagateFloat128NaN( a, a );
			
 
				+            end;
			
 
				+            result := a;
			
 
				+        end;
			
 
				+        lastBitMask := 1;
			
 
				+        lastBitMask := ( lastBitMask shl ( $406E - aExp ) ) shl 1;
			
 
				+        roundBitsMask := lastBitMask - 1;
			
 
				+        z := a;
			
 
				+        roundingMode := float_rounding_mode;
			
 
				+        if ( roundingMode = float_round_nearest_even ) begin
			
 
				+            if ( lastBitMask ) begin
			
 
				+                add128( z.high, z.low, 0, lastBitMask>>1, &z.high, &z.low );
			
 
				+                if ( ( z.low and roundBitsMask ) = 0 ) z.low &= ~ lastBitMask;
			
 
				+            end;
			
 
				+            else begin
			
 
				+                if ( (sbits64) z.low < 0 ) begin
			
 
				+                    ++z.high;
			
 
				+                    if ( (bits64) ( z.low shl 1 ) = 0 ) z.high &= ~1;
			
 
				+                end;
			
 
				+            end;
			
 
				+        end;
			
 
				+        else if ( roundingMode <> float_round_to_zero ) begin
			
 
				+            if (   extractFloat128Sign( z )
			
 
				+                 xor ( roundingMode = float_round_up ) ) begin
			
 
				+                add128( z.high, z.low, 0, roundBitsMask, &z.high, &z.low );
			
 
				+            end;
			
 
				+        end;
			
 
				+        z.low &= ~ roundBitsMask;
			
 
				+    end;
			
 
				+    else begin
			
 
				+        if ( aExp < $3FFF ) begin
			
 
				+            if ( ( ( (bits64) ( a.high shl 1 ) ) or a.low ) = 0 ) result := a;
			
 
				+            float_exception_flags or= float_flag_inexact;
			
 
				+            aSign := extractFloat128Sign( a );
			
 
				+            switch ( float_rounding_mode ) begin
			
 
				+             case float_round_nearest_even:
			
 
				+                if (    ( aExp = $3FFE )
			
 
				+                     and (   extractFloat128Frac0( a )
			
 
				+                          or extractFloat128Frac1( a ) )
			
 
				+                   ) begin
			
 
				+                    result := packFloat128( aSign, $3FFF, 0, 0 );
			
 
				+                end;
			
 
				+                break;
			
 
				+             case float_round_down:
			
 
				+                result :=
			
 
				+                      aSign ? packFloat128( 1, $3FFF, 0, 0 )
			
 
				+                    : packFloat128( 0, 0, 0, 0 );
			
 
				+             case float_round_up:
			
 
				+                result :=
			
 
				+                      aSign ? packFloat128( 1, 0, 0, 0 )
			
 
				+                    : packFloat128( 0, $3FFF, 0, 0 );
			
 
				+            end;
			
 
				+            result := packFloat128( aSign, 0, 0, 0 );
			
 
				+        end;
			
 
				+        lastBitMask := 1;
			
 
				+        lastBitMask  shl = $402F - aExp;
			
 
				+        roundBitsMask := lastBitMask - 1;
			
 
				+        z.low := 0;
			
 
				+        z.high := a.high;
			
 
				+        roundingMode := float_rounding_mode;
			
 
				+        if ( roundingMode = float_round_nearest_even ) begin
			
 
				+            z.high += lastBitMask>>1;
			
 
				+            if ( ( ( z.high and roundBitsMask ) or a.low ) = 0 ) begin
			
 
				+                z.high &= ~ lastBitMask;
			
 
				+            end;
			
 
				+        end;
			
 
				+        else if ( roundingMode <> float_round_to_zero ) begin
			
 
				+            if (   extractFloat128Sign( z )
			
 
				+                 xor ( roundingMode = float_round_up ) ) begin
			
 
				+                z.high or= ( a.low <> 0 );
			
 
				+                z.high += roundBitsMask;
			
 
				+            end;
			
 
				+        end;
			
 
				+        z.high &= ~ roundBitsMask;
			
 
				+    end;
			
 
				+    if ( ( z.low <> a.low ) or ( z.high <> a.high ) ) begin
			
 
				+        float_exception_flags or= float_flag_inexact;
			
 
				+    end;
			
 
				+    result := z;
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of adding the absolute values of the quadruple-precision
			
 
				+| floating-point values `a' and `b'.  If `zSign' is 1, the sum is negated
			
 
				+| before being returned.  `zSign' is ignored if the result is a NaN.
			
 
				+| The addition is performed according to the IEC/IEEE Standard for Binary
			
 
				+| Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function addFloat128Sigs( float128 a, float128 b, flag zSign ): float128;
			
 
				+begin
			
 
				+    int32 aExp, bExp, zExp;
			
 
				+    bits64 aSig0, aSig1, bSig0, bSig1, zSig0, zSig1, zSig2;
			
 
				+    int32 expDiff;
			
 
				+
			
 
				+    aSig1 := extractFloat128Frac1( a );
			
 
				+    aSig0 := extractFloat128Frac0( a );
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    bSig1 := extractFloat128Frac1( b );
			
 
				+    bSig0 := extractFloat128Frac0( b );
			
 
				+    bExp := extractFloat128Exp( b );
			
 
				+    expDiff := aExp - bExp;
			
 
				+    if ( 0 < expDiff ) begin
			
 
				+        if ( aExp = $7FFF ) begin
			
 
				+            if ( aSig0 or aSig1 ) result := propagateFloat128NaN( a, b );
			
 
				+            result := a;
			
 
				+        end;
			
 
				+        if ( bExp = 0 ) begin
			
 
				+            --expDiff;
			
 
				+        end;
			
 
				+        else begin
			
 
				+            bSig0 or= LIT64( $0001000000000000 );
			
 
				+        end;
			
 
				+        shift128ExtraRightJamming(
			
 
				+            bSig0, bSig1, 0, expDiff, &bSig0, &bSig1, &zSig2 );
			
 
				+        zExp := aExp;
			
 
				+    end;
			
 
				+    else if ( expDiff < 0 ) begin
			
 
				+        if ( bExp = $7FFF ) begin
			
 
				+            if ( bSig0 or bSig1 ) result := propagateFloat128NaN( a, b );
			
 
				+            result := packFloat128( zSign, $7FFF, 0, 0 );
			
 
				+        end;
			
 
				+        if ( aExp = 0 ) begin
			
 
				+            ++expDiff;
			
 
				+        end;
			
 
				+        else begin
			
 
				+            aSig0 or= LIT64( $0001000000000000 );
			
 
				+        end;
			
 
				+        shift128ExtraRightJamming(
			
 
				+            aSig0, aSig1, 0, - expDiff, &aSig0, &aSig1, &zSig2 );
			
 
				+        zExp := bExp;
			
 
				+    end;
			
 
				+    else begin
			
 
				+        if ( aExp = $7FFF ) begin
			
 
				+            if ( aSig0 or aSig1 or bSig0 or bSig1 ) begin
			
 
				+                result := propagateFloat128NaN( a, b );
			
 
				+            end;
			
 
				+            result := a;
			
 
				+        end;
			
 
				+        add128( aSig0, aSig1, bSig0, bSig1, &zSig0, &zSig1 );
			
 
				+        if ( aExp = 0 ) result := packFloat128( zSign, 0, zSig0, zSig1 );
			
 
				+        zSig2 := 0;
			
 
				+        zSig0 or= LIT64( $0002000000000000 );
			
 
				+        zExp := aExp;
			
 
				+        goto shiftRight1;
			
 
				+    end;
			
 
				+    aSig0 or= LIT64( $0001000000000000 );
			
 
				+    add128( aSig0, aSig1, bSig0, bSig1, &zSig0, &zSig1 );
			
 
				+    --zExp;
			
 
				+    if ( zSig0 < LIT64( $0002000000000000 ) ) goto roundAndPack;
			
 
				+    ++zExp;
			
 
				+ shiftRight1:
			
 
				+    shift128ExtraRightJamming(
			
 
				+        zSig0, zSig1, zSig2, 1, &zSig0, &zSig1, &zSig2 );
			
 
				+ roundAndPack:
			
 
				+    result := roundAndPackFloat128( zSign, zExp, zSig0, zSig1, zSig2 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of subtracting the absolute values of the quadruple-
			
 
				+| precision floating-point values `a' and `b'.  If `zSign' is 1, the
			
 
				+| difference is negated before being returned.  `zSign' is ignored if the
			
 
				+| result is a NaN.  The subtraction is performed according to the IEC/IEEE
			
 
				+| Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function subFloat128Sigs( float128 a, float128 b, flag zSign ): float128;
			
 
				+begin
			
 
				+    int32 aExp, bExp, zExp;
			
 
				+    bits64 aSig0, aSig1, bSig0, bSig1, zSig0, zSig1;
			
 
				+    int32 expDiff;
			
 
				+    float128 z;
			
 
				+
			
 
				+    aSig1 := extractFloat128Frac1( a );
			
 
				+    aSig0 := extractFloat128Frac0( a );
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    bSig1 := extractFloat128Frac1( b );
			
 
				+    bSig0 := extractFloat128Frac0( b );
			
 
				+    bExp := extractFloat128Exp( b );
			
 
				+    expDiff := aExp - bExp;
			
 
				+    shortShift128Left( aSig0, aSig1, 14, &aSig0, &aSig1 );
			
 
				+    shortShift128Left( bSig0, bSig1, 14, &bSig0, &bSig1 );
			
 
				+    if ( 0 < expDiff ) goto aExpBigger;
			
 
				+    if ( expDiff < 0 ) goto bExpBigger;
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if ( aSig0 or aSig1 or bSig0 or bSig1 ) begin
			
 
				+            result := propagateFloat128NaN( a, b );
			
 
				+        end;
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        z.low := float128_default_nan_low;
			
 
				+        z.high := float128_default_nan_high;
			
 
				+        result := z;
			
 
				+    end;
			
 
				+    if ( aExp = 0 ) begin
			
 
				+        aExp := 1;
			
 
				+        bExp := 1;
			
 
				+    end;
			
 
				+    if ( bSig0 < aSig0 ) goto aBigger;
			
 
				+    if ( aSig0 < bSig0 ) goto bBigger;
			
 
				+    if ( bSig1 < aSig1 ) goto aBigger;
			
 
				+    if ( aSig1 < bSig1 ) goto bBigger;
			
 
				+    result := packFloat128( float_rounding_mode = float_round_down, 0, 0, 0 );
			
 
				+ bExpBigger:
			
 
				+    if ( bExp = $7FFF ) begin
			
 
				+        if ( bSig0 or bSig1 ) result := propagateFloat128NaN( a, b );
			
 
				+        result := packFloat128( zSign xor 1, $7FFF, 0, 0 );
			
 
				+    end;
			
 
				+    if ( aExp = 0 ) begin
			
 
				+        ++expDiff;
			
 
				+    end;
			
 
				+    else begin
			
 
				+        aSig0 or= LIT64( $4000000000000000 );
			
 
				+    end;
			
 
				+    shift128RightJamming( aSig0, aSig1, - expDiff, &aSig0, &aSig1 );
			
 
				+    bSig0 or= LIT64( $4000000000000000 );
			
 
				+ bBigger:
			
 
				+    sub128( bSig0, bSig1, aSig0, aSig1, &zSig0, &zSig1 );
			
 
				+    zExp := bExp;
			
 
				+    zSign  xor = 1;
			
 
				+    goto normalizeRoundAndPack;
			
 
				+ aExpBigger:
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if ( aSig0 or aSig1 ) result := propagateFloat128NaN( a, b );
			
 
				+        result := a;
			
 
				+    end;
			
 
				+    if ( bExp = 0 ) begin
			
 
				+        --expDiff;
			
 
				+    end;
			
 
				+    else begin
			
 
				+        bSig0 or= LIT64( $4000000000000000 );
			
 
				+    end;
			
 
				+    shift128RightJamming( bSig0, bSig1, expDiff, &bSig0, &bSig1 );
			
 
				+    aSig0 or= LIT64( $4000000000000000 );
			
 
				+ aBigger:
			
 
				+    sub128( aSig0, aSig1, bSig0, bSig1, &zSig0, &zSig1 );
			
 
				+    zExp := aExp;
			
 
				+ normalizeRoundAndPack:
			
 
				+    --zExp;
			
 
				+    result := normalizeRoundAndPackFloat128( zSign, zExp - 14, zSig0, zSig1 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of adding the quadruple-precision floating-point values
			
 
				+| `a' and `b'.  The operation is performed according to the IEC/IEEE Standard
			
 
				+| for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_add(a: float128; b: float128): float128;
			
 
				+begin
			
 
				+    flag aSign, bSign;
			
 
				+
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    bSign := extractFloat128Sign( b );
			
 
				+    if ( aSign = bSign ) begin
			
 
				+        result := addFloat128Sigs( a, b, aSign );
			
 
				+    end;
			
 
				+    else begin
			
 
				+        result := subFloat128Sigs( a, b, aSign );
			
 
				+    end;
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of subtracting the quadruple-precision floating-point
			
 
				+| values `a' and `b'.  The operation is performed according to the IEC/IEEE
			
 
				+| Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_sub(a: float128; b: float128): float128;
			
 
				+begin
			
 
				+    flag aSign, bSign;
			
 
				+
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    bSign := extractFloat128Sign( b );
			
 
				+    if ( aSign = bSign ) begin
			
 
				+        result := subFloat128Sigs( a, b, aSign );
			
 
				+    end;
			
 
				+    else begin
			
 
				+        result := addFloat128Sigs( a, b, aSign );
			
 
				+    end;
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of multiplying the quadruple-precision floating-point
			
 
				+| values `a' and `b'.  The operation is performed according to the IEC/IEEE
			
 
				+| Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_mul(a: float128; b: float128): float128;
			
 
				+begin
			
 
				+    flag aSign, bSign, zSign;
			
 
				+    int32 aExp, bExp, zExp;
			
 
				+    bits64 aSig0, aSig1, bSig0, bSig1, zSig0, zSig1, zSig2, zSig3;
			
 
				+    float128 z;
			
 
				+
			
 
				+    aSig1 := extractFloat128Frac1( a );
			
 
				+    aSig0 := extractFloat128Frac0( a );
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    bSig1 := extractFloat128Frac1( b );
			
 
				+    bSig0 := extractFloat128Frac0( b );
			
 
				+    bExp := extractFloat128Exp( b );
			
 
				+    bSign := extractFloat128Sign( b );
			
 
				+    zSign := aSign xor bSign;
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if (    ( aSig0 or aSig1 )
			
 
				+             or ( ( bExp = $7FFF ) and ( bSig0 or bSig1 ) ) ) begin
			
 
				+            result := propagateFloat128NaN( a, b );
			
 
				+        end;
			
 
				+        if ( ( bExp or bSig0 or bSig1 ) = 0 ) goto invalid;
			
 
				+        result := packFloat128( zSign, $7FFF, 0, 0 );
			
 
				+    end;
			
 
				+    if ( bExp = $7FFF ) begin
			
 
				+        if ( bSig0 or bSig1 ) result := propagateFloat128NaN( a, b );
			
 
				+        if ( ( aExp or aSig0 or aSig1 ) = 0 ) begin
			
 
				+ invalid:
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            z.low := float128_default_nan_low;
			
 
				+            z.high := float128_default_nan_high;
			
 
				+            result := z;
			
 
				+        end;
			
 
				+        result := packFloat128( zSign, $7FFF, 0, 0 );
			
 
				+    end;
			
 
				+    if ( aExp = 0 ) begin
			
 
				+        if ( ( aSig0 or aSig1 ) = 0 ) result := packFloat128( zSign, 0, 0, 0 );
			
 
				+        normalizeFloat128Subnormal( aSig0, aSig1, &aExp, &aSig0, &aSig1 );
			
 
				+    end;
			
 
				+    if ( bExp = 0 ) begin
			
 
				+        if ( ( bSig0 or bSig1 ) = 0 ) result := packFloat128( zSign, 0, 0, 0 );
			
 
				+        normalizeFloat128Subnormal( bSig0, bSig1, &bExp, &bSig0, &bSig1 );
			
 
				+    end;
			
 
				+    zExp := aExp + bExp - $4000;
			
 
				+    aSig0 or= LIT64( $0001000000000000 );
			
 
				+    shortShift128Left( bSig0, bSig1, 16, &bSig0, &bSig1 );
			
 
				+    mul128To256( aSig0, aSig1, bSig0, bSig1, &zSig0, &zSig1, &zSig2, &zSig3 );
			
 
				+    add128( zSig0, zSig1, aSig0, aSig1, &zSig0, &zSig1 );
			
 
				+    zSig2 or= ( zSig3 <> 0 );
			
 
				+    if ( LIT64( $0002000000000000 ) <= zSig0 ) begin
			
 
				+        shift128ExtraRightJamming(
			
 
				+            zSig0, zSig1, zSig2, 1, &zSig0, &zSig1, &zSig2 );
			
 
				+        ++zExp;
			
 
				+    end;
			
 
				+    result := roundAndPackFloat128( zSign, zExp, zSig0, zSig1, zSig2 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the result of dividing the quadruple-precision floating-point value
			
 
				+| `a' by the corresponding value `b'.  The operation is performed according to
			
 
				+| the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_div(a: float128; b: float128): float128;
			
 
				+begin
			
 
				+    flag aSign, bSign, zSign;
			
 
				+    int32 aExp, bExp, zExp;
			
 
				+    bits64 aSig0, aSig1, bSig0, bSig1, zSig0, zSig1, zSig2;
			
 
				+    bits64 rem0, rem1, rem2, rem3, term0, term1, term2, term3;
			
 
				+    float128 z;
			
 
				+
			
 
				+    aSig1 := extractFloat128Frac1( a );
			
 
				+    aSig0 := extractFloat128Frac0( a );
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    bSig1 := extractFloat128Frac1( b );
			
 
				+    bSig0 := extractFloat128Frac0( b );
			
 
				+    bExp := extractFloat128Exp( b );
			
 
				+    bSign := extractFloat128Sign( b );
			
 
				+    zSign := aSign xor bSign;
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if ( aSig0 or aSig1 ) result := propagateFloat128NaN( a, b );
			
 
				+        if ( bExp = $7FFF ) begin
			
 
				+            if ( bSig0 or bSig1 ) result := propagateFloat128NaN( a, b );
			
 
				+            goto invalid;
			
 
				+        end;
			
 
				+        result := packFloat128( zSign, $7FFF, 0, 0 );
			
 
				+    end;
			
 
				+    if ( bExp = $7FFF ) begin
			
 
				+        if ( bSig0 or bSig1 ) result := propagateFloat128NaN( a, b );
			
 
				+        result := packFloat128( zSign, 0, 0, 0 );
			
 
				+    end;
			
 
				+    if ( bExp = 0 ) begin
			
 
				+        if ( ( bSig0 or bSig1 ) = 0 ) begin
			
 
				+            if ( ( aExp or aSig0 or aSig1 ) = 0 ) begin
			
 
				+ invalid:
			
 
				+                float_raise( float_flag_invalid );
			
 
				+                z.low := float128_default_nan_low;
			
 
				+                z.high := float128_default_nan_high;
			
 
				+                result := z;
			
 
				+            end;
			
 
				+            float_raise( float_flag_divbyzero );
			
 
				+            result := packFloat128( zSign, $7FFF, 0, 0 );
			
 
				+        end;
			
 
				+        normalizeFloat128Subnormal( bSig0, bSig1, &bExp, &bSig0, &bSig1 );
			
 
				+    end;
			
 
				+    if ( aExp = 0 ) begin
			
 
				+        if ( ( aSig0 or aSig1 ) = 0 ) result := packFloat128( zSign, 0, 0, 0 );
			
 
				+        normalizeFloat128Subnormal( aSig0, aSig1, &aExp, &aSig0, &aSig1 );
			
 
				+    end;
			
 
				+    zExp := aExp - bExp + $3FFD;
			
 
				+    shortShift128Left(
			
 
				+        aSig0 or LIT64( $0001000000000000 ), aSig1, 15, &aSig0, &aSig1 );
			
 
				+    shortShift128Left(
			
 
				+        bSig0 or LIT64( $0001000000000000 ), bSig1, 15, &bSig0, &bSig1 );
			
 
				+    if ( le128( bSig0, bSig1, aSig0, aSig1 ) ) begin
			
 
				+        shift128Right( aSig0, aSig1, 1, &aSig0, &aSig1 );
			
 
				+        ++zExp;
			
 
				+    end;
			
 
				+    zSig0 := estimateDiv128To64( aSig0, aSig1, bSig0 );
			
 
				+    mul128By64To192( bSig0, bSig1, zSig0, &term0, &term1, &term2 );
			
 
				+    sub192( aSig0, aSig1, 0, term0, term1, term2, &rem0, &rem1, &rem2 );
			
 
				+    while ( (sbits64) rem0 < 0 ) begin
			
 
				+        --zSig0;
			
 
				+        add192( rem0, rem1, rem2, 0, bSig0, bSig1, &rem0, &rem1, &rem2 );
			
 
				+    end;
			
 
				+    zSig1 := estimateDiv128To64( rem1, rem2, bSig0 );
			
 
				+    if ( ( zSig1 and $3FFF ) <= 4 ) begin
			
 
				+        mul128By64To192( bSig0, bSig1, zSig1, &term1, &term2, &term3 );
			
 
				+        sub192( rem1, rem2, 0, term1, term2, term3, &rem1, &rem2, &rem3 );
			
 
				+        while ( (sbits64) rem1 < 0 ) begin
			
 
				+            --zSig1;
			
 
				+            add192( rem1, rem2, rem3, 0, bSig0, bSig1, &rem1, &rem2, &rem3 );
			
 
				+        end;
			
 
				+        zSig1 or= ( ( rem1 or rem2 or rem3 ) <> 0 );
			
 
				+    end;
			
 
				+    shift128ExtraRightJamming( zSig0, zSig1, 0, 15, &zSig0, &zSig1, &zSig2 );
			
 
				+    result := roundAndPackFloat128( zSign, zExp, zSig0, zSig1, zSig2 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the remainder of the quadruple-precision floating-point value `a'
			
 
				+| with respect to the corresponding value `b'.  The operation is performed
			
 
				+| according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_rem(a: float128; b: float128): float128;
			
 
				+begin
			
 
				+    flag aSign, bSign, zSign;
			
 
				+    int32 aExp, bExp, expDiff;
			
 
				+    bits64 aSig0, aSig1, bSig0, bSig1, q, term0, term1, term2;
			
 
				+    bits64 allZero, alternateASig0, alternateASig1, sigMean1;
			
 
				+    sbits64 sigMean0;
			
 
				+    float128 z;
			
 
				+
			
 
				+    aSig1 := extractFloat128Frac1( a );
			
 
				+    aSig0 := extractFloat128Frac0( a );
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    bSig1 := extractFloat128Frac1( b );
			
 
				+    bSig0 := extractFloat128Frac0( b );
			
 
				+    bExp := extractFloat128Exp( b );
			
 
				+    bSign := extractFloat128Sign( b );
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if (    ( aSig0 or aSig1 )
			
 
				+             or ( ( bExp = $7FFF ) and ( bSig0 or bSig1 ) ) ) begin
			
 
				+            result := propagateFloat128NaN( a, b );
			
 
				+        end;
			
 
				+        goto invalid;
			
 
				+    end;
			
 
				+    if ( bExp = $7FFF ) begin
			
 
				+        if ( bSig0 or bSig1 ) result := propagateFloat128NaN( a, b );
			
 
				+        result := a;
			
 
				+    end;
			
 
				+    if ( bExp = 0 ) begin
			
 
				+        if ( ( bSig0 or bSig1 ) = 0 ) begin
			
 
				+ invalid:
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            z.low := float128_default_nan_low;
			
 
				+            z.high := float128_default_nan_high;
			
 
				+            result := z;
			
 
				+        end;
			
 
				+        normalizeFloat128Subnormal( bSig0, bSig1, &bExp, &bSig0, &bSig1 );
			
 
				+    end;
			
 
				+    if ( aExp = 0 ) begin
			
 
				+        if ( ( aSig0 or aSig1 ) = 0 ) result := a;
			
 
				+        normalizeFloat128Subnormal( aSig0, aSig1, &aExp, &aSig0, &aSig1 );
			
 
				+    end;
			
 
				+    expDiff := aExp - bExp;
			
 
				+    if ( expDiff < -1 ) result := a;
			
 
				+    shortShift128Left(
			
 
				+        aSig0 or LIT64( $0001000000000000 ),
			
 
				+        aSig1,
			
 
				+        15 - ( expDiff < 0 ),
			
 
				+        &aSig0,
			
 
				+        &aSig1
			
 
				+    );
			
 
				+    shortShift128Left(
			
 
				+        bSig0 or LIT64( $0001000000000000 ), bSig1, 15, &bSig0, &bSig1 );
			
 
				+    q := le128( bSig0, bSig1, aSig0, aSig1 );
			
 
				+    if ( q ) sub128( aSig0, aSig1, bSig0, bSig1, &aSig0, &aSig1 );
			
 
				+    expDiff -= 64;
			
 
				+    while ( 0 < expDiff ) begin
			
 
				+        q := estimateDiv128To64( aSig0, aSig1, bSig0 );
			
 
				+        q := ( 4 < q ) ? q - 4 : 0;
			
 
				+        mul128By64To192( bSig0, bSig1, q, &term0, &term1, &term2 );
			
 
				+        shortShift192Left( term0, term1, term2, 61, &term1, &term2, &allZero );
			
 
				+        shortShift128Left( aSig0, aSig1, 61, &aSig0, &allZero );
			
 
				+        sub128( aSig0, 0, term1, term2, &aSig0, &aSig1 );
			
 
				+        expDiff -= 61;
			
 
				+    end;
			
 
				+    if ( -64 < expDiff ) begin
			
 
				+        q := estimateDiv128To64( aSig0, aSig1, bSig0 );
			
 
				+        q := ( 4 < q ) ? q - 4 : 0;
			
 
				+        q >>= - expDiff;
			
 
				+        shift128Right( bSig0, bSig1, 12, &bSig0, &bSig1 );
			
 
				+        expDiff += 52;
			
 
				+        if ( expDiff < 0 ) begin
			
 
				+            shift128Right( aSig0, aSig1, - expDiff, &aSig0, &aSig1 );
			
 
				+        end;
			
 
				+        else begin
			
 
				+            shortShift128Left( aSig0, aSig1, expDiff, &aSig0, &aSig1 );
			
 
				+        end;
			
 
				+        mul128By64To192( bSig0, bSig1, q, &term0, &term1, &term2 );
			
 
				+        sub128( aSig0, aSig1, term1, term2, &aSig0, &aSig1 );
			
 
				+    end;
			
 
				+    else begin
			
 
				+        shift128Right( aSig0, aSig1, 12, &aSig0, &aSig1 );
			
 
				+        shift128Right( bSig0, bSig1, 12, &bSig0, &bSig1 );
			
 
				+    end;
			
 
				+    do begin
			
 
				+        alternateASig0 := aSig0;
			
 
				+        alternateASig1 := aSig1;
			
 
				+        ++q;
			
 
				+        sub128( aSig0, aSig1, bSig0, bSig1, &aSig0, &aSig1 );
			
 
				+    end; while ( 0 <= (sbits64) aSig0 );
			
 
				+    add128(
			
 
				+        aSig0, aSig1, alternateASig0, alternateASig1, &sigMean0, &sigMean1 );
			
 
				+    if (    ( sigMean0 < 0 )
			
 
				+         or ( ( ( sigMean0 or sigMean1 ) = 0 ) and ( q and 1 ) ) ) begin
			
 
				+        aSig0 := alternateASig0;
			
 
				+        aSig1 := alternateASig1;
			
 
				+    end;
			
 
				+    zSign := ( (sbits64) aSig0 < 0 );
			
 
				+    if ( zSign ) sub128( 0, 0, aSig0, aSig1, &aSig0, &aSig1 );
			
 
				+    result :=
			
 
				+        normalizeRoundAndPackFloat128( aSign xor zSign, bExp - 4, aSig0, aSig1 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns the square root of the quadruple-precision floating-point value `a'.
			
 
				+| The operation is performed according to the IEC/IEEE Standard for Binary
			
 
				+| Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_sqrt(a: float128): float128;
			
 
				+begin
			
 
				+    flag aSign;
			
 
				+    int32 aExp, zExp;
			
 
				+    bits64 aSig0, aSig1, zSig0, zSig1, zSig2, doubleZSig0;
			
 
				+    bits64 rem0, rem1, rem2, rem3, term0, term1, term2, term3;
			
 
				+    float128 z;
			
 
				+
			
 
				+    aSig1 := extractFloat128Frac1( a );
			
 
				+    aSig0 := extractFloat128Frac0( a );
			
 
				+    aExp := extractFloat128Exp( a );
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    if ( aExp = $7FFF ) begin
			
 
				+        if ( aSig0 or aSig1 ) result := propagateFloat128NaN( a, a );
			
 
				+        if ( ! aSign ) result := a;
			
 
				+        goto invalid;
			
 
				+    end;
			
 
				+    if ( aSign ) begin
			
 
				+        if ( ( aExp or aSig0 or aSig1 ) = 0 ) result := a;
			
 
				+ invalid:
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        z.low := float128_default_nan_low;
			
 
				+        z.high := float128_default_nan_high;
			
 
				+        result := z;
			
 
				+    end;
			
 
				+    if ( aExp = 0 ) begin
			
 
				+        if ( ( aSig0 or aSig1 ) = 0 ) result := packFloat128( 0, 0, 0, 0 );
			
 
				+        normalizeFloat128Subnormal( aSig0, aSig1, &aExp, &aSig0, &aSig1 );
			
 
				+    end;
			
 
				+    zExp := ( ( aExp - $3FFF )>>1 ) + $3FFE;
			
 
				+    aSig0 or= LIT64( $0001000000000000 );
			
 
				+    zSig0 := estimateSqrt32( aExp, aSig0>>17 );
			
 
				+    shortShift128Left( aSig0, aSig1, 13 - ( aExp and 1 ), &aSig0, &aSig1 );
			
 
				+    zSig0 := estimateDiv128To64( aSig0, aSig1, zSig0 shl 32 ) + ( zSig0 shl 30 );
			
 
				+    doubleZSig0 := zSig0 shl 1;
			
 
				+    mul64To128( zSig0, zSig0, &term0, &term1 );
			
 
				+    sub128( aSig0, aSig1, term0, term1, &rem0, &rem1 );
			
 
				+    while ( (sbits64) rem0 < 0 ) begin
			
 
				+        --zSig0;
			
 
				+        doubleZSig0 -= 2;
			
 
				+        add128( rem0, rem1, zSig0>>63, doubleZSig0 or 1, &rem0, &rem1 );
			
 
				+    end;
			
 
				+    zSig1 := estimateDiv128To64( rem1, 0, doubleZSig0 );
			
 
				+    if ( ( zSig1 and $1FFF ) <= 5 ) begin
			
 
				+        if ( zSig1 = 0 ) zSig1 := 1;
			
 
				+        mul64To128( doubleZSig0, zSig1, &term1, &term2 );
			
 
				+        sub128( rem1, 0, term1, term2, &rem1, &rem2 );
			
 
				+        mul64To128( zSig1, zSig1, &term2, &term3 );
			
 
				+        sub192( rem1, rem2, 0, 0, term2, term3, &rem1, &rem2, &rem3 );
			
 
				+        while ( (sbits64) rem1 < 0 ) begin
			
 
				+            --zSig1;
			
 
				+            shortShift128Left( 0, zSig1, 1, &term2, &term3 );
			
 
				+            term3 or= 1;
			
 
				+            term2 or= doubleZSig0;
			
 
				+            add192( rem1, rem2, rem3, 0, term2, term3, &rem1, &rem2, &rem3 );
			
 
				+        end;
			
 
				+        zSig1 or= ( ( rem1 or rem2 or rem3 ) <> 0 );
			
 
				+    end;
			
 
				+    shift128ExtraRightJamming( zSig0, zSig1, 0, 14, &zSig0, &zSig1, &zSig2 );
			
 
				+    result := roundAndPackFloat128( 0, zExp, zSig0, zSig1, zSig2 );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the quadruple-precision floating-point value `a' is equal to
			
 
				+| the corresponding value `b', and 0 otherwise.  The comparison is performed
			
 
				+| according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_eq(a: float128; b: float128): flag;
			
 
				+begin
			
 
				+
			
 
				+    if (    (    ( extractFloat128Exp( a ) = $7FFF )
			
 
				+              and ( extractFloat128Frac0( a ) or extractFloat128Frac1( a ) ) )
			
 
				+         or (    ( extractFloat128Exp( b ) = $7FFF )
			
 
				+              and ( extractFloat128Frac0( b ) or extractFloat128Frac1( b ) ) )
			
 
				+       ) begin
			
 
				+        if (    float128_is_signaling_nan( a )
			
 
				+             or float128_is_signaling_nan( b ) ) begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+        end;
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    result :=
			
 
				+           ( a.low = b.low )
			
 
				+        and (    ( a.high = b.high )
			
 
				+             or (    ( a.low = 0 )
			
 
				+                  and ( (bits64) ( ( a.high or b.high ) shl 1 ) = 0 ) )
			
 
				+           );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the quadruple-precision floating-point value `a' is less than
			
 
				+| or equal to the corresponding value `b', and 0 otherwise.  The comparison
			
 
				+| is performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+| Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_le(a: float128; b: float128): flag;
			
 
				+begin
			
 
				+    flag aSign, bSign;
			
 
				+
			
 
				+    if (    (    ( extractFloat128Exp( a ) = $7FFF )
			
 
				+              and ( extractFloat128Frac0( a ) or extractFloat128Frac1( a ) ) )
			
 
				+         or (    ( extractFloat128Exp( b ) = $7FFF )
			
 
				+              and ( extractFloat128Frac0( b ) or extractFloat128Frac1( b ) ) )
			
 
				+       ) begin
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    bSign := extractFloat128Sign( b );
			
 
				+    if ( aSign <> bSign ) begin
			
 
				+        result :=
			
 
				+               aSign
			
 
				+            or (    ( ( (bits64) ( ( a.high or b.high ) shl 1 ) ) or a.low or b.low )
			
 
				+                 = 0 );
			
 
				+    end;
			
 
				+    result :=
			
 
				+          aSign ? le128( b.high, b.low, a.high, a.low )
			
 
				+        : le128( a.high, a.low, b.high, b.low );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the quadruple-precision floating-point value `a' is less than
			
 
				+| the corresponding value `b', and 0 otherwise.  The comparison is performed
			
 
				+| according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_lt(a: float128; b: float128): flag;
			
 
				+begin
			
 
				+    flag aSign, bSign;
			
 
				+
			
 
				+    if (    (    ( extractFloat128Exp( a ) = $7FFF )
			
 
				+              and ( extractFloat128Frac0( a ) or extractFloat128Frac1( a ) ) )
			
 
				+         or (    ( extractFloat128Exp( b ) = $7FFF )
			
 
				+              and ( extractFloat128Frac0( b ) or extractFloat128Frac1( b ) ) )
			
 
				+       ) begin
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    bSign := extractFloat128Sign( b );
			
 
				+    if ( aSign <> bSign ) begin
			
 
				+        result :=
			
 
				+               aSign
			
 
				+            and (    ( ( (bits64) ( ( a.high or b.high ) shl 1 ) ) or a.low or b.low )
			
 
				+                 <> 0 );
			
 
				+    end;
			
 
				+    result :=
			
 
				+          aSign ? lt128( b.high, b.low, a.high, a.low )
			
 
				+        : lt128( a.high, a.low, b.high, b.low );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the quadruple-precision floating-point value `a' is equal to
			
 
				+| the corresponding value `b', and 0 otherwise.  The invalid exception is
			
 
				+| raised if either operand is a NaN.  Otherwise, the comparison is performed
			
 
				+| according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_eq_signaling(a: float128; b: float128): flag;
			
 
				+begin
			
 
				+
			
 
				+    if (    (    ( extractFloat128Exp( a ) = $7FFF )
			
 
				+              and ( extractFloat128Frac0( a ) or extractFloat128Frac1( a ) ) )
			
 
				+         or (    ( extractFloat128Exp( b ) = $7FFF )
			
 
				+              and ( extractFloat128Frac0( b ) or extractFloat128Frac1( b ) ) )
			
 
				+       ) begin
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    result :=
			
 
				+           ( a.low = b.low )
			
 
				+        and (    ( a.high = b.high )
			
 
				+             or (    ( a.low = 0 )
			
 
				+                  and ( (bits64) ( ( a.high or b.high ) shl 1 ) = 0 ) )
			
 
				+           );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the quadruple-precision floating-point value `a' is less than
			
 
				+| or equal to the corresponding value `b', and 0 otherwise.  Quiet NaNs do not
			
 
				+| cause an exception.  Otherwise, the comparison is performed according to the
			
 
				+| IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_le_quiet(a: float128; b: float128): flag;
			
 
				+begin
			
 
				+    flag aSign, bSign;
			
 
				+
			
 
				+    if (    (    ( extractFloat128Exp( a ) = $7FFF )
			
 
				+              and ( extractFloat128Frac0( a ) or extractFloat128Frac1( a ) ) )
			
 
				+         or (    ( extractFloat128Exp( b ) = $7FFF )
			
 
				+              and ( extractFloat128Frac0( b ) or extractFloat128Frac1( b ) ) )
			
 
				+       ) begin
			
 
				+        if (    float128_is_signaling_nan( a )
			
 
				+             or float128_is_signaling_nan( b ) ) begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+        end;
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    bSign := extractFloat128Sign( b );
			
 
				+    if ( aSign <> bSign ) begin
			
 
				+        result :=
			
 
				+               aSign
			
 
				+            or (    ( ( (bits64) ( ( a.high or b.high ) shl 1 ) ) or a.low or b.low )
			
 
				+                 = 0 );
			
 
				+    end;
			
 
				+    result :=
			
 
				+          aSign ? le128( b.high, b.low, a.high, a.low )
			
 
				+        : le128( a.high, a.low, b.high, b.low );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the quadruple-precision floating-point value `a' is less than
			
 
				+| the corresponding value `b', and 0 otherwise.  Quiet NaNs do not cause an
			
 
				+| exception.  Otherwise, the comparison is performed according to the IEC/IEEE
			
 
				+| Standard for Binary Floating-Point Arithmetic.
			
 
				+*----------------------------------------------------------------------------*}
			
 
				+
			
 
				+function float128_lt_quiet(a: float128; b: float128): flag;
			
 
				+begin
			
 
				+    flag aSign, bSign;
			
 
				+
			
 
				+    if (    (    ( extractFloat128Exp( a ) = $7FFF )
			
 
				+              and ( extractFloat128Frac0( a ) or extractFloat128Frac1( a ) ) )
			
 
				+         or (    ( extractFloat128Exp( b ) = $7FFF )
			
 
				+              and ( extractFloat128Frac0( b ) or extractFloat128Frac1( b ) ) )
			
 
				+       ) begin
			
 
				+        if (    float128_is_signaling_nan( a )
			
 
				+             or float128_is_signaling_nan( b ) ) begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+        end;
			
 
				+        result := 0;
			
 
				+    end;
			
 
				+    aSign := extractFloat128Sign( a );
			
 
				+    bSign := extractFloat128Sign( b );
			
 
				+    if ( aSign <> bSign ) begin
			
 
				+        result :=
			
 
				+               aSign
			
 
				+            and (    ( ( (bits64) ( ( a.high or b.high ) shl 1 ) ) or a.low or b.low )
			
 
				+                 <> 0 );
			
 
				+    end;
			
 
				+    result :=
			
 
				+          aSign ? lt128( b.high, b.low, a.high, a.low )
			
 
				+        : lt128( a.high, a.low, b.high, b.low );
			
 
				+
			
 
				+end;
			
 
				+
			
 
				+{$endif FPC_SOFTFLOAT_FLOAT128}
			
 
				+
			
 
				 {$endif not(defined(fpc_softfpu_interface))}
			
 
				 
			
 
				 {$if not(defined(fpc_softfpu_interface)) and not(defined(fpc_softfpu_implementation))}