23 years ago · bf6a6b4d46
--- a/rtl/inc/softfpu.pp
+++ b/rtl/inc/softfpu.pp
@@ -0,0 +1,4494 @@
 
				+
			
 
				+{*
			
 
				+===============================================================================
			
 
				+The original notice of the softfloat package is shown below. The conversion
			
 
				+to pascal was done by Carl Eric Codere in 2002 ([email protected]).
			
 
				+===============================================================================
			
 
				+
			
 
				+This C source file is part of the SoftFloat IEC/IEEE Floating-Point
			
 
				+Arithmetic Package, Release 2a. 
			
 
				+
			
 
				+Written by John R. Hauser.  This work was made possible in part by the
			
 
				+International Computer Science Institute, located at Suite 600, 1947 Center
			
 
				+Street, Berkeley, California 94704.  Funding was partially provided by the
			
 
				+National Science Foundation under grant MIP-9311980.  The original version
			
 
				+of this code was written as part of a project to build a fixed-point vector
			
 
				+processor in collaboration with the University of California at Berkeley,
			
 
				+overseen by Profs. Nelson Morgan and John Wawrzynek.  More information
			
 
				+is available through the Web page 
			
 
				+`http://HTTP.CS.Berkeley.EDU/~jhauser/arithmetic/SoftFloat.html'.
			
 
				+
			
 
				+THIS SOFTWARE IS DISTRIBUTED AS IS, FOR FREE.  Although reasonable effort
			
 
				+has been made to avoid it, THIS SOFTWARE MAY CONTAIN FAULTS THAT WILL AT
			
 
				+TIMES RESULT IN INCORRECT BEHAVIOR.  USE OF THIS SOFTWARE IS RESTRICTED TO
			
 
				+PERSONS AND ORGANIZATIONS WHO CAN AND WILL TAKE FULL RESPONSIBILITY FOR ANY
			
 
				+AND ALL LOSSES, COSTS, OR OTHER PROBLEMS ARISING FROM ITS USE.
			
 
				+
			
 
				+Derivative works are acceptable, even for commercial purposes, so long as
			
 
				+(1) they include prominent notice that the work is derivative, and (2) they
			
 
				+include prominent notice akin to these four paragraphs for those parts of
			
 
				+this code that are retained.
			
 
				+
			
 
				+===============================================================================
			
 
				+*}
			
 
				+
			
 
				+unit softfpu;
			
 
				+
			
 
				+interface
			
 
				+
			
 
				+
			
 
				+{
			
 
				+-------------------------------------------------------------------------------
			
 
				+Software IEC/IEEE floating-point types.
			
 
				+-------------------------------------------------------------------------------
			
 
				+}
			
 
				+TYPE
			
 
				+  float32 = longint;
			
 
				+
			
 
				+  flag = byte;
			
 
				+  uint8 = byte;
			
 
				+  int8 = shortint;
			
 
				+  uint16 = word;
			
 
				+  int16 = integer;
			
 
				+  uint32 = longint;
			
 
				+  int32 = longint;
			
 
				+
			
 
				+  bits8 = byte;
			
 
				+  sbits8 = shortint;
			
 
				+  bits16 = word;
			
 
				+  sbits16 = integer;
			
 
				+  sbits32 = longint;
			
 
				+  bits32 = longint;
			
 
				+{$ifdef ENDIAN_LITTLE}
			
 
				+  float64 = packed record
			
 
				+    low: longword;
			
 
				+    high: longword;
			
 
				+  end;
			
 
				+{$else}
			
 
				+ float64 = packed record
			
 
				+   high,low : longword;
			
 
				+ end;
			
 
				+
			
 
				+{$endif}
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the double-precision floating-point value `a' is less than
			
 
				+the corresponding value `b', and 0 otherwise.  The comparison is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_lt(a: float64;b: float64): flag; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the double-precision floating-point value `a' is less than
			
 
				+or equal to the corresponding value `b', and 0 otherwise.  The comparison
			
 
				+is performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_le(a: float64;b: float64): flag; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the double-precision floating-point value `a' is equal to
			
 
				+the corresponding value `b', and 0 otherwise.  The comparison is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_eq(a: float64;b: float64): flag; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the square root of the double-precision floating-point value `a'.
			
 
				+The operation is performed according to the IEC/IEEE Standard for Binary
			
 
				+Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_sqrt( a: float64; var out: float64 ); 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the remainder of the double-precision floating-point value `a'
			
 
				+with respect to the corresponding value `b'.  The operation is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_rem(a: float64; b : float64; var out: float64); 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of dividing the double-precision floating-point value `a'
			
 
				+by the corresponding value `b'.  The operation is performed according to the
			
 
				+IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_div(a: float64; b : float64 ; var out: float64 ); 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of multiplying the double-precision floating-point values
			
 
				+`a' and `b'.  The operation is performed according to the IEC/IEEE Standard
			
 
				+for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_mul( a: float64; b:float64; Var out: float64); 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of subtracting the double-precision floating-point values
			
 
				+`a' and `b'.  The operation is performed according to the IEC/IEEE Standard
			
 
				+for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_sub(a: float64; b : float64; var out: float64); 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of adding the double-precision floating-point values `a'
			
 
				+and `b'.  The operation is performed according to the IEC/IEEE Standard for
			
 
				+Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_add( a: float64; b : float64; Var out : float64); 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Rounds the double-precision floating-point value `a' to an integer,
			
 
				+and returns the result as a double-precision floating-point value.  The
			
 
				+operation is performed according to the IEC/IEEE Standard for Binary
			
 
				+Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_round_to_int(a: float64; var out: float64 ); 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the double-precision floating-point value
			
 
				+`a' to the single-precision floating-point format.  The conversion is
			
 
				+performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_to_float32(a: float64 ): float32; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the double-precision floating-point value
			
 
				+`a' to the 32-bit two's complement integer format.  The conversion is
			
 
				+performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic, except that the conversion is always rounded toward zero.
			
 
				+If `a' is a NaN, the largest positive integer is returned.  Otherwise, if
			
 
				+the conversion overflows, the largest integer with the same sign as `a' is
			
 
				+returned.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_to_int32_round_to_zero(a: float64 ): int32; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the double-precision floating-point value
			
 
				+`a' to the 32-bit two's complement integer format.  The conversion is
			
 
				+performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic---which means in particular that the conversion is rounded
			
 
				+according to the current rounding mode.  If `a' is a NaN, the largest
			
 
				+positive integer is returned.  Otherwise, if the conversion overflows, the
			
 
				+largest integer with the same sign as `a' is returned.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_to_int32(a: float64): int32; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the single-precision floating-point value `a' is less than
			
 
				+the corresponding value `b', and 0 otherwise.  The comparison is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_lt( a:float32 ; b : float32): flag; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the single-precision floating-point value `a' is less than
			
 
				+or equal to the corresponding value `b', and 0 otherwise.  The comparison
			
 
				+is performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_le( a: float32; b : float32 ):flag; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the single-precision floating-point value `a' is equal to
			
 
				+the corresponding value `b', and 0 otherwise.  The comparison is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_eq( a:float32; b:float32): flag; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the square root of the single-precision floating-point value `a'.
			
 
				+The operation is performed according to the IEC/IEEE Standard for Binary
			
 
				+Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_sqrt(a: float32 ): float32; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the remainder of the single-precision floating-point value `a'
			
 
				+with respect to the corresponding value `b'.  The operation is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_rem(a: float32; b: float32 ):float32; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of dividing the single-precision floating-point value `a'
			
 
				+by the corresponding value `b'.  The operation is performed according to the
			
 
				+IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_div(a: float32;b: float32 ): float32; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of multiplying the single-precision floating-point values
			
 
				+`a' and `b'.  The operation is performed according to the IEC/IEEE Standard
			
 
				+for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_mul(a: float32; b: float32 ) : float32; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of subtracting the single-precision floating-point values
			
 
				+`a' and `b'.  The operation is performed according to the IEC/IEEE Standard
			
 
				+for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_sub( a: float32 ; b:float32 ): float32; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of adding the single-precision floating-point values `a'
			
 
				+and `b'.  The operation is performed according to the IEC/IEEE Standard for
			
 
				+Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_add( a: float32; b:float32 ): float32; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Rounds the single-precision floating-point value `a' to an integer,
			
 
				+and returns the result as a single-precision floating-point value.  The
			
 
				+operation is performed according to the IEC/IEEE Standard for Binary
			
 
				+Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_round_to_int( a: float32): float32; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the single-precision floating-point value
			
 
				+`a' to the double-precision floating-point format.  The conversion is
			
 
				+performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float32_to_float64( a : float32; var out: Float64); 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the single-precision floating-point value
			
 
				+`a' to the 32-bit two's complement integer format.  The conversion is
			
 
				+performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic, except that the conversion is always rounded toward zero.
			
 
				+If `a' is a NaN, the largest positive integer is returned.  Otherwise, if
			
 
				+the conversion overflows, the largest integer with the same sign as `a' is
			
 
				+returned.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_to_int32_round_to_zero( a: Float32 ): int32; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the single-precision floating-point value
			
 
				+`a' to the 32-bit two's complement integer format.  The conversion is
			
 
				+performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic---which means in particular that the conversion is rounded
			
 
				+according to the current rounding mode.  If `a' is a NaN, the largest
			
 
				+positive integer is returned.  Otherwise, if the conversion overflows, the
			
 
				+largest integer with the same sign as `a' is returned.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_to_int32( a : float32) : int32; 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the 32-bit two's complement integer `a' to
			
 
				+the double-precision floating-point format.  The conversion is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure int32_to_float64( a: int32; var c: float64 ); 
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the 32-bit two's complement integer `a' to
			
 
				+the single-precision floating-point format.  The conversion is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function int32_to_float32( a: int32): float32; 
			
 
				+
			
 
				+
			
 
				+CONST
			
 
				+{-------------------------------------------------------------------------------
			
 
				+Software IEC/IEEE floating-point underflow tininess-detection mode.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+    float_tininess_after_rounding  = 0;
			
 
				+    float_tininess_before_rounding = 1;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Software IEC/IEEE floating-point rounding mode.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+{
			
 
				+Round to nearest. 
			
 
				+This is the default mode. It should be used unless there is a specific 
			
 
				+need for one of the others. In this mode results are rounded to the 
			
 
				+nearest representable value. If the result is midway between two 
			
 
				+representable values, the even representable is chosen. Even here 
			
 
				+means the lowest-order bit is zero. This rounding mode prevents 
			
 
				+statistical bias and guarantees numeric stability: round-off errors 
			
 
				+in a lengthy calculation will remain smaller than half of FLT_EPSILON. 
			
 
				+
			
 
				+Round toward plus Infinity. 
			
 
				+All results are rounded to the smallest representable value which is 
			
 
				+greater than the result. 
			
 
				+
			
 
				+Round toward minus Infinity. 
			
 
				+All results are rounded to the largest representable value which is 
			
 
				+less than the result. 
			
 
				+
			
 
				+Round toward zero. 
			
 
				+All results are rounded to the largest representable value whose 
			
 
				+magnitude is less than that of the result. In other words, if the 
			
 
				+result is negative it is rounded up; if it is positive, it is 
			
 
				+rounded down. 
			
 
				+}
			
 
				+    float_round_nearest_even = 0;
			
 
				+    float_round_down         = 1;
			
 
				+    float_round_up           = 2;
			
 
				+    float_round_to_zero      = 3;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Software IEC/IEEE floating-point exception flags.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+    float_flag_invalid   =  1;
			
 
				+    float_flag_divbyzero =  4;
			
 
				+    float_flag_overflow  =  8;
			
 
				+    float_flag_underflow = 16;
			
 
				+    float_flag_inexact   = 32;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Floating-point rounding mode and exception flags.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+const
			
 
				+ float_rounding_mode : Byte = float_round_nearest_even;
			
 
				+ float_exception_flags : Byte = 0;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Underflow tininess-detection mode, statically initialized to default value.
			
 
				+(The declaration in `softfloat.h' must match the `int8' type here.)
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+
			
 
				+const float_detect_tininess: int8 = float_tininess_after_rounding;
			
 
				+
			
 
				+
			
 
				+
			
 
				+
			
 
				+implementation
			
 
				+
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Raises the exceptions specified by `flags'.  Floating-point traps can be
			
 
				+defined here if desired.  It is currently not possible for such a trap
			
 
				+to substitute a result value.  If traps are not implemented, this routine
			
 
				+should be simply `float_exception_flags |= flags;'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+procedure float_raise( i: shortint );
			
 
				+Begin
			
 
				+  float_exception_flags := float_exception_flags or i;
			
 
				+  if (float_exception_flags and float_flag_invalid) <> 0 then
			
 
				+     RunError(207)
			
 
				+  else  
			
 
				+  if (float_exception_flags and float_flag_divbyzero) <> 0 then
			
 
				+     RunError(200)
			
 
				+  else
			
 
				+  if (float_exception_flags and float_flag_overflow) <> 0 then
			
 
				+     RunError(205)
			
 
				+  else
			
 
				+  if (float_exception_flags and float_flag_underflow) <> 0 then
			
 
				+     RunError(206);
			
 
				+end;
			
 
				+
			
 
				+
			
 
				+(*****************************************************************************)
			
 
				+(*----------------------------------------------------------------------------*)
			
 
				+(* Primitive arithmetic functions, including multi-word arithmetic, and       *)
			
 
				+(* division and square root approximations.  (Can be specialized to target if *)
			
 
				+(* desired.)                                                                  *)
			
 
				+(* ---------------------------------------------------------------------------*)
			
 
				+(*****************************************************************************)
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Shifts `a' right by the number of bits given in `count'.  If any nonzero
			
 
				+bits are shifted off, they are ``jammed'' into the least significant bit of
			
 
				+the result by setting the least significant bit to 1.  The value of `count'
			
 
				+can be arbitrarily large; in particular, if `count' is greater than 32, the
			
 
				+result will be either 0 or 1, depending on whether `a' is zero or nonzero.
			
 
				+The result is stored in the location pointed to by `zPtr'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure shift32RightJamming( a: bits32 ; count: int16 ; VAR zPtr :bits32);
			
 
				+var
			
 
				+  z: Bits32;
			
 
				+Begin
			
 
				+    if ( count = 0 ) then
			
 
				+        z := a
			
 
				+   else 
			
 
				+    if ( count < 32 ) then
			
 
				+    Begin
			
 
				+        z := ( a shr count ) or bits32( (( a shl ( ( - count ) AND 31 )) ) <> 0);
			
 
				+    End
			
 
				+   else
			
 
				+    Begin
			
 
				+        z := bits32( a <> 0 );
			
 
				+    End;
			
 
				+    zPtr := z;
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Shifts the 64-bit value formed by concatenating `a0' and `a1' right by the
			
 
				+number of bits given in `count'.  Any bits shifted off are lost.  The value
			
 
				+of `count' can be arbitrarily large; in particular, if `count' is greater
			
 
				+than 64, the result will be 0.  The result is broken into two 32-bit pieces
			
 
				+which are stored at the locations pointed to by `z0Ptr' and `z1Ptr'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure
			
 
				+ shift64Right(
			
 
				+     a0 :bits32; a1: bits32; count:int16; VAR z0Ptr:bits32; VAR z1Ptr:bits32);
			
 
				+Var
			
 
				+  z0, z1: bits32;
			
 
				+  negCount : int8;
			
 
				+Begin
			
 
				+    negCount := ( - count ) AND 31;
			
 
				+
			
 
				+    if ( count = 0 ) then
			
 
				+    Begin
			
 
				+        z1 := a1;
			
 
				+        z0 := a0;
			
 
				+    End
			
 
				+    else if ( count < 32 ) then
			
 
				+    Begin
			
 
				+        z1 := ( a0 shl negCount ) OR ( a1 shr count );
			
 
				+        z0 := a0 shr count;
			
 
				+    End
			
 
				+   else
			
 
				+    Begin
			
 
				+        if (count < 64) then
			
 
				+          z1 := ( a0 shr ( count AND 31 ) )
			
 
				+        else
			
 
				+          z1 := 0;
			
 
				+        z0 := 0;
			
 
				+    End;
			
 
				+    z1Ptr := z1;
			
 
				+    z0Ptr := z0;
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Shifts the 64-bit value formed by concatenating `a0' and `a1' right by the
			
 
				+number of bits given in `count'.  If any nonzero bits are shifted off, they
			
 
				+are ``jammed'' into the least significant bit of the result by setting the
			
 
				+least significant bit to 1.  The value of `count' can be arbitrarily large;
			
 
				+in particular, if `count' is greater than 64, the result will be either 0
			
 
				+or 1, depending on whether the concatenation of `a0' and `a1' is zero or
			
 
				+nonzero.  The result is broken into two 32-bit pieces which are stored at
			
 
				+the locations pointed to by `z0Ptr' and `z1Ptr'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure
			
 
				+ shift64RightJamming(
			
 
				+     a0:bits32; a1: bits32; count:int16; VAR Z0Ptr :bits32;VAR z1Ptr: bits32 );
			
 
				+VAR
			
 
				+    z0, z1 : bits32;
			
 
				+    negCount : int8;
			
 
				+Begin
			
 
				+    negCount := ( - count ) AND 31;
			
 
				+
			
 
				+    if ( count = 0 ) then
			
 
				+    Begin
			
 
				+        z1 := a1;
			
 
				+        z0 := a0;
			
 
				+    End
			
 
				+   else 
			
 
				+    if ( count < 32 ) then
			
 
				+    Begin
			
 
				+        z1 := ( a0 shl negCount ) OR ( a1 shr count ) OR bits32( ( a1 shl negCount ) <> 0 );
			
 
				+        z0 := a0 shr count;
			
 
				+    End
			
 
				+   else
			
 
				+    Begin
			
 
				+        if ( count = 32 ) then
			
 
				+        Begin
			
 
				+            z1 := a0 OR bits32( a1 <> 0 );
			
 
				+        End
			
 
				+       else 
			
 
				+        if ( count < 64 ) Then
			
 
				+        Begin
			
 
				+            z1 := ( a0 shr ( count AND 31 ) ) OR bits32( ( ( a0 shl negCount ) OR a1 ) <> 0 );
			
 
				+        End
			
 
				+       else
			
 
				+        Begin
			
 
				+            z1 := bits32( ( a0 OR a1 ) <> 0 );
			
 
				+        End;
			
 
				+        z0 := 0;
			
 
				+    End;
			
 
				+    z1Ptr := z1;
			
 
				+    z0Ptr := z0;
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Shifts the 96-bit value formed by concatenating `a0', `a1', and `a2' right
			
 
				+by 32 _plus_ the number of bits given in `count'.  The shifted result is
			
 
				+at most 64 nonzero bits; these are broken into two 32-bit pieces which are
			
 
				+stored at the locations pointed to by `z0Ptr' and `z1Ptr'.  The bits shifted
			
 
				+off form a third 32-bit result as follows:  The _last_ bit shifted off is
			
 
				+the most-significant bit of the extra result, and the other 31 bits of the
			
 
				+extra result are all zero if and only if _all_but_the_last_ bits shifted off
			
 
				+were all zero.  This extra result is stored in the location pointed to by
			
 
				+`z2Ptr'.  The value of `count' can be arbitrarily large.
			
 
				+    (This routine makes more sense if `a0', `a1', and `a2' are considered
			
 
				+to form a fixed-point value with binary point between `a1' and `a2'.  This
			
 
				+fixed-point value is shifted right by the number of bits given in `count',
			
 
				+and the integer part of the result is returned at the locations pointed to
			
 
				+by `z0Ptr' and `z1Ptr'.  The fractional part of the result may be slightly
			
 
				+corrupted as described above, and is returned at the location pointed to by
			
 
				+`z2Ptr'.)
			
 
				+-------------------------------------------------------------------------------
			
 
				+}
			
 
				+Procedure
			
 
				+ shift64ExtraRightJamming(
			
 
				+     a0: bits32;
			
 
				+     a1: bits32;
			
 
				+     a2: bits32;
			
 
				+     count: int16;
			
 
				+     VAR z0Ptr: bits32;
			
 
				+     VAR z1Ptr: bits32;
			
 
				+     VAR z2Ptr: bits32
			
 
				+ );
			
 
				+Var
			
 
				+    z0, z1, z2: bits32;
			
 
				+    negCount : int8;
			
 
				+Begin
			
 
				+    negCount := ( - count ) AND 31;
			
 
				+
			
 
				+    if ( count = 0 ) then
			
 
				+    Begin
			
 
				+        z2 := a2;
			
 
				+        z1 := a1;
			
 
				+        z0 := a0;
			
 
				+    End
			
 
				+   else
			
 
				+    Begin
			
 
				+        if ( count < 32 ) Then
			
 
				+        Begin
			
 
				+            z2 := a1 shl negCount;
			
 
				+            z1 := ( a0 shl negCount ) OR ( a1 shr count );
			
 
				+            z0 := a0 shr count;
			
 
				+        End
			
 
				+       else
			
 
				+        Begin
			
 
				+            if ( count = 32 ) then
			
 
				+            Begin
			
 
				+                z2 := a1;
			
 
				+                z1 := a0;
			
 
				+            End
			
 
				+           else
			
 
				+            Begin
			
 
				+                a2 := a2 or a1;
			
 
				+                if ( count < 64 ) then
			
 
				+                Begin
			
 
				+                    z2 := a0 shl negCount;
			
 
				+                    z1 := a0 shr ( count AND 31 );
			
 
				+                End
			
 
				+               else
			
 
				+                Begin
			
 
				+                    if count = 64 then
			
 
				+                       z2 := a0
			
 
				+                    else
			
 
				+                       z2 := bits32(a0 <> 0);
			
 
				+                    z1 := 0;
			
 
				+                End;
			
 
				+            End;
			
 
				+            z0 := 0;
			
 
				+        End;
			
 
				+        z2 := z2 or bits32( a2 <> 0 );
			
 
				+    End;
			
 
				+    z2Ptr := z2;
			
 
				+    z1Ptr := z1;
			
 
				+    z0Ptr := z0;
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Shifts the 64-bit value formed by concatenating `a0' and `a1' left by the
			
 
				+number of bits given in `count'.  Any bits shifted off are lost.  The value
			
 
				+of `count' must be less than 32.  The result is broken into two 32-bit
			
 
				+pieces which are stored at the locations pointed to by `z0Ptr' and `z1Ptr'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure
			
 
				+ shortShift64Left(
			
 
				+     a0:bits32; a1:bits32; count:int16; VAR z0Ptr:bits32; VAR z1Ptr:bits32 );
			
 
				+Begin
			
 
				+
			
 
				+    z1Ptr := a1 shl count;
			
 
				+    if count = 0 then
			
 
				+      z0Ptr := a0
			
 
				+    else
			
 
				+      z0Ptr := ( a0 shl count ) OR ( a1 shr ( ( - count ) AND 31 ) );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Shifts the 96-bit value formed by concatenating `a0', `a1', and `a2' left
			
 
				+by the number of bits given in `count'.  Any bits shifted off are lost.
			
 
				+The value of `count' must be less than 32.  The result is broken into three
			
 
				+32-bit pieces which are stored at the locations pointed to by `z0Ptr',
			
 
				+`z1Ptr', and `z2Ptr'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure
			
 
				+ shortShift96Left(
			
 
				+     a0: bits32;
			
 
				+     a1: bits32;
			
 
				+     a2: bits32;
			
 
				+     count: int16;
			
 
				+     VAR z0Ptr: bits32;
			
 
				+     VAR z1Ptr: bits32;
			
 
				+     VAR z2Ptr: bits32
			
 
				+ );
			
 
				+Var
			
 
				+    z0, z1, z2: bits32;
			
 
				+    negCount: int8;
			
 
				+Begin
			
 
				+    z2 := a2 shl count;
			
 
				+    z1 := a1 shl count;
			
 
				+    z0 := a0 shl count;
			
 
				+    if ( 0 < count ) then
			
 
				+    Begin
			
 
				+        negCount := ( ( - count ) AND 31 );
			
 
				+        z1 := z1 or (a2 shr negCount);
			
 
				+        z0 := z0 or (a1 shr negCount);
			
 
				+    End;
			
 
				+    z2Ptr := z2;
			
 
				+    z1Ptr := z1;
			
 
				+    z0Ptr := z0;
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Adds the 64-bit value formed by concatenating `a0' and `a1' to the 64-bit
			
 
				+value formed by concatenating `b0' and `b1'.  Addition is modulo 2^64, so
			
 
				+any carry out is lost.  The result is broken into two 32-bit pieces which
			
 
				+are stored at the locations pointed to by `z0Ptr' and `z1Ptr'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure
			
 
				+ add64(
			
 
				+     a0:bits32; a1:bits32; b0:bits32; b1:bits32; VAR z0Ptr:bits32; VAR z1Ptr:bits32 );
			
 
				+Var
			
 
				+    z1: bits32;
			
 
				+Begin
			
 
				+    z1 := a1 + b1;
			
 
				+    z1Ptr := z1;
			
 
				+    z0Ptr := a0 + b0 + bits32( z1 < a1 );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Adds the 96-bit value formed by concatenating `a0', `a1', and `a2' to the
			
 
				+96-bit value formed by concatenating `b0', `b1', and `b2'.  Addition is
			
 
				+modulo 2^96, so any carry out is lost.  The result is broken into three
			
 
				+32-bit pieces which are stored at the locations pointed to by `z0Ptr',
			
 
				+`z1Ptr', and `z2Ptr'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure
			
 
				+ add96(
			
 
				+     a0: bits32;
			
 
				+     a1: bits32;
			
 
				+     a2: bits32;
			
 
				+     b0: bits32;
			
 
				+     b1: bits32;
			
 
				+     b2: bits32;
			
 
				+     VAR z0Ptr: bits32;
			
 
				+     VAR z1Ptr: bits32;
			
 
				+     VAR z2Ptr: bits32
			
 
				+ );
			
 
				+var
			
 
				+    z0, z1, z2: bits32;
			
 
				+    carry0, carry1: int8;
			
 
				+Begin
			
 
				+    z2 := a2 + b2;
			
 
				+    carry1 := int8( z2 < a2 );
			
 
				+    z1 := a1 + b1;
			
 
				+    carry0 := int8( z1 < a1 );
			
 
				+    z0 := a0 + b0;
			
 
				+    z1 := z1 + carry1;
			
 
				+    z0 := z0 + bits32( z1 < carry1 );
			
 
				+    z0 := z0 + carry0;
			
 
				+    z2Ptr := z2;
			
 
				+    z1Ptr := z1;
			
 
				+    z0Ptr := z0;
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Subtracts the 64-bit value formed by concatenating `b0' and `b1' from the
			
 
				+64-bit value formed by concatenating `a0' and `a1'.  Subtraction is modulo
			
 
				+2^64, so any borrow out (carry out) is lost.  The result is broken into two
			
 
				+32-bit pieces which are stored at the locations pointed to by `z0Ptr' and
			
 
				+`z1Ptr'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure
			
 
				+ sub64(
			
 
				+     a0: bits32; a1 : bits32; b0 :bits32; b1: bits32; VAR z0Ptr:bits32; VAR z1Ptr: bits32 );
			
 
				+Begin
			
 
				+    z1Ptr := a1 - b1;
			
 
				+    z0Ptr := a0 - b0 - bits32( a1 < b1 );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Subtracts the 96-bit value formed by concatenating `b0', `b1', and `b2' from
			
 
				+the 96-bit value formed by concatenating `a0', `a1', and `a2'.  Subtraction
			
 
				+is modulo 2^96, so any borrow out (carry out) is lost.  The result is broken
			
 
				+into three 32-bit pieces which are stored at the locations pointed to by
			
 
				+`z0Ptr', `z1Ptr', and `z2Ptr'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure
			
 
				+ sub96(
			
 
				+     a0:bits32;
			
 
				+     a1:bits32;
			
 
				+     a2:bits32;
			
 
				+     b0:bits32;
			
 
				+     b1:bits32;
			
 
				+     b2:bits32;
			
 
				+     VAR z0Ptr:bits32;
			
 
				+     VAR z1Ptr:bits32;
			
 
				+     VAR z2Ptr:bits32
			
 
				+ );
			
 
				+Var
			
 
				+    z0, z1, z2: bits32;
			
 
				+    borrow0, borrow1: int8;
			
 
				+Begin
			
 
				+    z2 := a2 - b2;
			
 
				+    borrow1 := int8( a2 < b2 );
			
 
				+    z1 := a1 - b1;
			
 
				+    borrow0 := int8( a1 < b1 );
			
 
				+    z0 := a0 - b0;
			
 
				+    z0 := z0 - bits32( z1 < borrow1 );
			
 
				+    z1 := z1 - borrow1;
			
 
				+    z0 := z0 -borrow0;
			
 
				+    z2Ptr := z2;
			
 
				+    z1Ptr := z1;
			
 
				+    z0Ptr := z0;
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Multiplies `a' by `b' to obtain a 64-bit product.  The product is broken
			
 
				+into two 32-bit pieces which are stored at the locations pointed to by
			
 
				+`z0Ptr' and `z1Ptr'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure mul32To64( a:bits32; b:bits32; VAR z0Ptr: bits32; VAR z1Ptr
			
 
				+:bits32 );
			
 
				+Var
			
 
				+    aHigh, aLow, bHigh, bLow: bits16;
			
 
				+    z0, zMiddleA, zMiddleB, z1: bits32;
			
 
				+Begin
			
 
				+    aLow := a;
			
 
				+    aHigh := a shr 16;
			
 
				+    bLow := b;
			
 
				+    bHigh := b shr 16;
			
 
				+    z1 := ( bits32( aLow) ) * bLow;
			
 
				+    zMiddleA := ( bits32 (aLow) ) * bHigh;
			
 
				+    zMiddleB := ( bits32 (aHigh) ) * bLow;
			
 
				+    z0 := ( bits32 (aHigh) ) * bHigh;
			
 
				+    zMiddleA := zMiddleA + zMiddleB;
			
 
				+    z0 := z0 + ( ( bits32 ( zMiddleA < zMiddleB ) ) shl 16 ) + ( zMiddleA shr 16 );
			
 
				+    zMiddleA := zmiddleA shl 16;
			
 
				+    z1 := z1 + zMiddleA;
			
 
				+    z0 := z0 + bits32( z1 < zMiddleA );
			
 
				+    z1Ptr := z1;
			
 
				+    z0Ptr := z0;
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Multiplies the 64-bit value formed by concatenating `a0' and `a1' by `b'
			
 
				+to obtain a 96-bit product.  The product is broken into three 32-bit pieces
			
 
				+which are stored at the locations pointed to by `z0Ptr', `z1Ptr', and
			
 
				+`z2Ptr'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure
			
 
				+ mul64By32To96(
			
 
				+     a0:bits32;
			
 
				+     a1:bits32;
			
 
				+     b:bits32;
			
 
				+     VAR z0Ptr:bits32;
			
 
				+     VAR z1Ptr:bits32;
			
 
				+     VAR z2Ptr:bits32
			
 
				+ );
			
 
				+Var
			
 
				+    z0, z1, z2, more1: bits32;
			
 
				+Begin
			
 
				+    mul32To64( a1, b, z1, z2 );
			
 
				+    mul32To64( a0, b, z0, more1 );
			
 
				+    add64( z0, more1, 0, z1, z0, z1 );
			
 
				+    z2Ptr := z2;
			
 
				+    z1Ptr := z1;
			
 
				+    z0Ptr := z0;
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Multiplies the 64-bit value formed by concatenating `a0' and `a1' to the
			
 
				+64-bit value formed by concatenating `b0' and `b1' to obtain a 128-bit
			
 
				+product.  The product is broken into four 32-bit pieces which are stored at
			
 
				+the locations pointed to by `z0Ptr', `z1Ptr', `z2Ptr', and `z3Ptr'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure
			
 
				+ mul64To128(
			
 
				+     a0:bits32;
			
 
				+     a1:bits32;
			
 
				+     b0:bits32;
			
 
				+     b1:bits32;
			
 
				+     VAR z0Ptr:bits32;
			
 
				+     VAR z1Ptr:bits32;
			
 
				+     VAR z2Ptr:bits32;
			
 
				+     VAR z3Ptr:bits32
			
 
				+ );
			
 
				+Var
			
 
				+    z0, z1, z2, z3: bits32;
			
 
				+    more1, more2: bits32;
			
 
				+Begin
			
 
				+
			
 
				+    mul32To64( a1, b1, z2, z3 );
			
 
				+    mul32To64( a1, b0, z1, more2 );
			
 
				+    add64( z1, more2, 0, z2, z1, z2 );
			
 
				+    mul32To64( a0, b0, z0, more1 );
			
 
				+    add64( z0, more1, 0, z1, z0, z1 );
			
 
				+    mul32To64( a0, b1, more1, more2 );
			
 
				+    add64( more1, more2, 0, z2, more1, z2 );
			
 
				+    add64( z0, z1, 0, more1, z0, z1 );
			
 
				+    z3Ptr := z3;
			
 
				+    z2Ptr := z2;
			
 
				+    z1Ptr := z1;
			
 
				+    z0Ptr := z0;
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns an approximation to the 32-bit integer quotient obtained by dividing
			
 
				+`b' into the 64-bit value formed by concatenating `a0' and `a1'.  The
			
 
				+divisor `b' must be at least 2^31.  If q is the exact quotient truncated
			
 
				+toward zero, the approximation returned lies between q and q + 2 inclusive.
			
 
				+If the exact quotient q is larger than 32 bits, the maximum positive 32-bit
			
 
				+unsigned integer is returned.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function estimateDiv64To32( a0:bits32; a1: bits32; b:bits32): bits32;
			
 
				+Var
			
 
				+    b0, b1: bits32;
			
 
				+    rem0, rem1, term0, term1: bits32;
			
 
				+    z: bits32;
			
 
				+Begin
			
 
				+    if ( b <= a0 ) then
			
 
				+    Begin
			
 
				+       estimateDiv64To32 := $FFFFFFFF;
			
 
				+       exit;
			
 
				+    End;
			
 
				+    b0 := b shr 16;
			
 
				+    if ( b0 shl 16 <= a0 ) then
			
 
				+       z:= $FFFF0000
			
 
				+     else
			
 
				+       z:= ( a0 div b0 ) shl 16;
			
 
				+    mul32To64( b, z, term0, term1 );
			
 
				+    sub64( a0, a1, term0, term1, rem0, rem1 );
			
 
				+    while ( ( sbits32 (rem0) ) < 0 ) do
			
 
				+    Begin
			
 
				+        z := z - $10000;
			
 
				+        b1 := b shl 16;
			
 
				+        add64( rem0, rem1, b0, b1, rem0, rem1 );
			
 
				+    End;
			
 
				+    rem0 := ( rem0 shl 16 ) OR ( rem1 shr 16 );
			
 
				+    if ( b0 shl 16 <= rem0 ) then
			
 
				+      z := z or $FFFF
			
 
				+    else
			
 
				+      z := z or (rem0 div b0);
			
 
				+    estimateDiv64To32 := z;
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns an approximation to the square root of the 32-bit significand given
			
 
				+by `a'.  Considered as an integer, `a' must be at least 2^31.  If bit 0 of
			
 
				+`aExp' (the least significant bit) is 1, the integer returned approximates
			
 
				+2^31*sqrt(`a'/2^31), where `a' is considered an integer.  If bit 0 of `aExp'
			
 
				+is 0, the integer returned approximates 2^31*sqrt(`a'/2^30).  In either
			
 
				+case, the approximation returned lies strictly within +/-2 of the exact
			
 
				+value.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function estimateSqrt32( aExp: int16; a: bits32 ): bits32;
			
 
				+    const sqrtOddAdjustments: array[0..15] of bits16 = (
			
 
				+        $0004, $0022, $005D, $00B1, $011D, $019F, $0236, $02E0,
			
 
				+        $039C, $0468, $0545, $0631, $072B, $0832, $0946, $0A67
			
 
				+    );
			
 
				+    const sqrtEvenAdjustments: array[0..15] of bits16 = (
			
 
				+        $0A2D, $08AF, $075A, $0629, $051A, $0429, $0356, $029E,
			
 
				+        $0200, $0179, $0109, $00AF, $0068, $0034, $0012, $0002
			
 
				+    );
			
 
				+Var
			
 
				+    index: int8;
			
 
				+    z: bits32;
			
 
				+Begin
			
 
				+
			
 
				+    index := ( a shr 27 ) AND 15;
			
 
				+    if ( aExp AND 1 ) <> 0  then
			
 
				+    Begin
			
 
				+        z := $4000 + ( a shr 17 ) - sqrtOddAdjustments[ index ];
			
 
				+        z := ( ( a div z ) shl 14 ) + ( z shl 15 );
			
 
				+        a := a shr 1;
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        z := $8000 + ( a shr 17 ) - sqrtEvenAdjustments[ index ];
			
 
				+        z := a div z + z;
			
 
				+        if ( $20000 <= z ) then
			
 
				+          z := $FFFF8000
			
 
				+        else
			
 
				+          z := ( z shl 15 );
			
 
				+        if ( z <= a ) then
			
 
				+        Begin
			
 
				+           estimateSqrt32 := bits32 ( ( sbits32 (a )) shr 1 );
			
 
				+           exit;
			
 
				+        End;
			
 
				+    End;
			
 
				+    estimateSqrt32 := ( ( estimateDiv64To32( a, 0, z ) ) shr 1 ) + ( z shr 1 );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the number of leading 0 bits before the most-significant 1 bit of
			
 
				+`a'.  If `a' is zero, 32 is returned.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function countLeadingZeros32( a:bits32 ): int8;
			
 
				+
			
 
				+    const countLeadingZerosHigh:array[0..255] of int8 = (
			
 
				+        8, 7, 6, 6, 5, 5, 5, 5, 4, 4, 4, 4, 4, 4, 4, 4,
			
 
				+        3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
			
 
				+        2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
			
 
				+        2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
			
 
				+        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
			
 
				+        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
			
 
				+        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
			
 
				+        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
			
 
				+        0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			
 
				+        0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			
 
				+        0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			
 
				+        0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			
 
				+        0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			
 
				+        0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			
 
				+        0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
			
 
				+        0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0
			
 
				+    );
			
 
				+Var
			
 
				+    shiftCount: int8;
			
 
				+Begin
			
 
				+
			
 
				+    shiftCount := 0;
			
 
				+    if ( a < $10000 ) then
			
 
				+    Begin
			
 
				+        shiftCount := shiftcount + 16;
			
 
				+        a := a shl 16;
			
 
				+    End;
			
 
				+    if ( a < $1000000 ) then
			
 
				+    Begin
			
 
				+        shiftCount := shiftcount + 8;
			
 
				+        a := a shl 8;
			
 
				+    end;
			
 
				+    shiftCount := shiftcount + countLeadingZerosHigh[ a shr 24 ];
			
 
				+    countLeadingZeros32:= shiftCount;
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the 64-bit value formed by concatenating `a0' and `a1' is
			
 
				+equal to the 64-bit value formed by concatenating `b0' and `b1'.  Otherwise,
			
 
				+returns 0.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function eq64( a0: bits32; a1:bits32 ;b0:bits32; b1:bits32 ): flag;
			
 
				+Begin
			
 
				+    eq64 :=  flag( a0 = b0 ) and flag( a1 = b1 );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the 64-bit value formed by concatenating `a0' and `a1' is less
			
 
				+than or equal to the 64-bit value formed by concatenating `b0' and `b1'.
			
 
				+Otherwise, returns 0.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function le64( a0: bits32; a1:bits32 ;b0:bits32; b1:bits32 ): flag;
			
 
				+Begin
			
 
				+
			
 
				+    le64:= flag( a0 < b0 ) or flag( ( a0 = b0 ) and ( a1 <= b1 ) );
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the 64-bit value formed by concatenating `a0' and `a1' is less
			
 
				+than the 64-bit value formed by concatenating `b0' and `b1'.  Otherwise,
			
 
				+returns 0.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function lt64( a0: bits32; a1:bits32 ;b0:bits32; b1:bits32 ): flag;
			
 
				+Begin
			
 
				+    lt64 := flag( a0 < b0 ) or flag( ( a0 = b0 ) and ( a1 < b1 ) );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the 64-bit value formed by concatenating `a0' and `a1' is not
			
 
				+equal to the 64-bit value formed by concatenating `b0' and `b1'.  Otherwise,
			
 
				+returns 0.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function ne64( a0: bits32; a1:bits32 ;b0:bits32; b1:bits32 ): flag;
			
 
				+Begin
			
 
				+    ne64:= flag( a0 <> b0 ) or flag( a1 <> b1 );
			
 
				+End;
			
 
				+
			
 
				+(*****************************************************************************)
			
 
				+(*                      End Low-Level arithmetic                             *)
			
 
				+(*****************************************************************************)
			
 
				+
			
 
				+
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Functions and definitions to determine:  (1) whether tininess for underflow
			
 
				+is detected before or after rounding by default, (2) what (if anything)
			
 
				+happens when exceptions are raised, (3) how signaling NaNs are distinguished
			
 
				+from quiet NaNs, (4) the default generated quiet NaNs, and (4) how NaNs
			
 
				+are propagated from function inputs to output.  These details are ENDIAN
			
 
				+specific
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+{$IFDEF ENDIAN_LITTLE}
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Internal canonical NaN format.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+TYPE
			
 
				+
			
 
				+
			
 
				+ commonNaNT = packed record
			
 
				+   sign: flag;
			
 
				+   high, low : bits32;
			
 
				+ end;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+The pattern for a default generated single-precision NaN.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+const float32_default_nan = $FFC00000;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the single-precision floating-point value `a' is a NaN;
			
 
				+otherwise returns 0.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_is_nan( a : float32 ): flag;
			
 
				+Begin
			
 
				+
			
 
				+    float32_is_nan:= flag( $FF000000 < bits32 ( a shl 1 ) );
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the single-precision floating-point value `a' is a signaling
			
 
				+NaN; otherwise returns 0.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_is_signaling_nan( a : float32  ): flag;
			
 
				+Begin
			
 
				+
			
 
				+    float32_is_signaling_nan := flag
			
 
				+      ( ( ( a shr 22 ) and $1FF ) = $1FE ) and( a and $003FFFFF );
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the single-precision floating-point NaN
			
 
				+`a' to the canonical NaN format.  If `a' is a signaling NaN, the invalid
			
 
				+exception is raised.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float32ToCommonNaN( a: float32; VAR c:commonNaNT  );
			
 
				+var
			
 
				+    z : commonNaNT ;
			
 
				+Begin
			
 
				+    if ( float32_is_signaling_nan( a ) <> 0) then
			
 
				+       float_raise( float_flag_invalid );
			
 
				+    z.sign := a shr 31;
			
 
				+    z.low := 0;
			
 
				+    z.high := a shl 9;
			
 
				+    c := z;
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the canonical NaN `a' to the single-
			
 
				+precision floating-point format.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function commonNaNToFloat32( a : commonNaNT ): float32;
			
 
				+Begin
			
 
				+    commonNaNToFloat32 := ( ( bits32 (a.sign) ) shl 31 ) or $7FC00000 or ( a.high shr 9 );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Takes two single-precision floating-point values `a' and `b', one of which
			
 
				+is a NaN, and returns the appropriate NaN result.  If either `a' or `b' is a
			
 
				+signaling NaN, the invalid exception is raised.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function propagateFloat32NaN( a : float32 ; b: float32 ): float32;
			
 
				+Var
			
 
				+    aIsNaN, aIsSignalingNaN, bIsNaN, bIsSignalingNaN: flag;
			
 
				+label returnLargerSignificand;
			
 
				+Begin
			
 
				+    aIsNaN := float32_is_nan( a );
			
 
				+    aIsSignalingNaN := float32_is_signaling_nan( a );
			
 
				+    bIsNaN := float32_is_nan( b );
			
 
				+    bIsSignalingNaN := float32_is_signaling_nan( b );
			
 
				+    a := a or $00400000;
			
 
				+    b := b or $00400000;
			
 
				+    if ( aIsSignalingNaN or bIsSignalingNaN ) <> 0 then
			
 
				+        float_raise( float_flag_invalid );
			
 
				+    if ( aIsSignalingNaN )<> 0  then
			
 
				+    Begin
			
 
				+        if ( bIsSignalingNaN ) <>  0 then
			
 
				+          goto returnLargerSignificand;
			
 
				+        if bIsNan <> 0 then
			
 
				+          propagateFloat32NaN := b
			
 
				+        else
			
 
				+          propagateFloat32NaN := a;
			
 
				+        exit;
			
 
				+    End
			
 
				+    else if ( aIsNaN <> 0) then
			
 
				+    Begin
			
 
				+        if ( bIsSignalingNaN or not bIsNaN )<> 0 then
			
 
				+        Begin
			
 
				+           propagateFloat32NaN := a;
			
 
				+           exit;
			
 
				+        End;
			
 
				+ returnLargerSignificand:
			
 
				+        if ( bits32 ( a shl 1 ) < bits32 ( b shl 1 ) ) then
			
 
				+        Begin
			
 
				+           propagateFloat32NaN := b;
			
 
				+           exit;
			
 
				+        End;
			
 
				+        if ( bits32 ( b shl 1 ) < bits32 ( a shl 1 ) ) then
			
 
				+        Begin
			
 
				+           propagateFloat32NaN :=  a;
			
 
				+        End;
			
 
				+        if a < b then
			
 
				+          propagateFloat32NaN := a
			
 
				+        else
			
 
				+          propagateFloat32NaN := b;
			
 
				+        exit;
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        propagateFloat32NaN := b;
			
 
				+        exit;
			
 
				+    End;
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+The pattern for a default generated double-precision NaN.  The `high' and
			
 
				+`low' values hold the most- and least-significant bits, respectively.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+const
			
 
				+    float64_default_nan_high = $FFF80000;
			
 
				+    float64_default_nan_low  = $00000000;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the double-precision floating-point value `a' is a NaN;
			
 
				+otherwise returns 0.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_is_nan( a : float64 ) : flag;
			
 
				+Begin
			
 
				+
			
 
				+    float64_is_nan :=
			
 
				+           flag( $FFE00000 <= bits32 ( a.high shl 1 ) )
			
 
				+        and ( a.low or ( a.high and $000FFFFF ) );
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the double-precision floating-point value `a' is a signaling
			
 
				+NaN; otherwise returns 0.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_is_signaling_nan( a : float64 ): flag;
			
 
				+Begin
			
 
				+
			
 
				+    float64_is_signaling_nan :=
			
 
				+           flag( ( ( a.high shr 19 ) and $FFF ) = $FFE )
			
 
				+        and ( a.low or ( a.high and $0007FFFF ) );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the double-precision floating-point NaN
			
 
				+`a' to the canonical NaN format.  If `a' is a signaling NaN, the invalid
			
 
				+exception is raised.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64ToCommonNaN( a : float64; VAR c:commonNaNT );
			
 
				+Var
			
 
				+    z : commonNaNT;
			
 
				+Begin
			
 
				+    if ( float64_is_signaling_nan( a )<>0 ) then
			
 
				+        float_raise( float_flag_invalid );
			
 
				+    z.sign := a.high shr 31;
			
 
				+    shortShift64Left( a.high, a.low, 12, z.high, z.low );
			
 
				+    c := z;
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the canonical NaN `a' to the double-
			
 
				+precision floating-point format.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure commonNaNToFloat64( a : commonNaNT; VAR c: float64  );
			
 
				+Var
			
 
				+    z: float64;
			
 
				+Begin
			
 
				+    shift64Right( a.high, a.low, 12, z.high, z.low );
			
 
				+    z.high := z.high or ( ( bits32 (a.sign) ) shl 31 ) or $7FF80000;
			
 
				+    c := z;
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Takes two double-precision floating-point values `a' and `b', one of which
			
 
				+is a NaN, and returns the appropriate NaN result.  If either `a' or `b' is a
			
 
				+signaling NaN, the invalid exception is raised.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure propagateFloat64NaN( a: float64; b: float64 ; VAR c: float64 );
			
 
				+Var
			
 
				+    aIsNaN, aIsSignalingNaN, bIsNaN, bIsSignalingNaN: flag;
			
 
				+    label returnLargerSignificand;
			
 
				+Begin
			
 
				+    aIsNaN := float64_is_nan( a );
			
 
				+    aIsSignalingNaN := float64_is_signaling_nan( a );
			
 
				+    bIsNaN := float64_is_nan( b );
			
 
				+    bIsSignalingNaN := float64_is_signaling_nan( b );
			
 
				+    a.high := a.high or $00080000;
			
 
				+    b.high := b.high or $00080000;
			
 
				+    if ( aIsSignalingNaN or bIsSignalingNaN )<> 0 then
			
 
				+        float_raise( float_flag_invalid );
			
 
				+    if ( aIsSignalingNaN )<>0 then
			
 
				+    Begin
			
 
				+        if ( bIsSignalingNaN )<>0 then
			
 
				+            goto returnLargerSignificand;
			
 
				+        if bIsNan <> 0 then
			
 
				+           c := b
			
 
				+        else
			
 
				+           c := a;
			
 
				+        exit;
			
 
				+    End
			
 
				+    else if ( aIsNaN )<> 0 then
			
 
				+    Begin
			
 
				+        if ( bIsSignalingNaN or not bIsNaN ) <> 0 then
			
 
				+        Begin
			
 
				+          c := a;
			
 
				+           exit;
			
 
				+        End;
			
 
				+ returnLargerSignificand:
			
 
				+        if ( lt64( a.high shl 1, a.low, b.high shl 1, b.low ) ) <> 0 then
			
 
				+        Begin
			
 
				+           c := b;
			
 
				+           exit;
			
 
				+        End;
			
 
				+        if ( lt64( b.high shl 1, b.low, a.high shl 1, a.low ) ) <> 0 then
			
 
				+        Begin
			
 
				+           c := a;
			
 
				+           exit;
			
 
				+        End;
			
 
				+        if a.high < b.high then
			
 
				+         c := a
			
 
				+        else
			
 
				+         c := b;
			
 
				+        exit;
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        c := b;
			
 
				+        exit;
			
 
				+    End;
			
 
				+End;
			
 
				+{$ELSE}
			
 
				+{ Big endian code }
			
 
				+(*----------------------------------------------------------------------------
			
 
				+| Internal canonical NaN format.
			
 
				+*----------------------------------------------------------------------------*)
			
 
				+ commonNANT = packed record
			
 
				+  sign : flag;
			
 
				+  high, low : bits32;
			
 
				+ end;
			
 
				+ 
			
 
				+(*----------------------------------------------------------------------------
			
 
				+| The pattern for a default generated single-precision NaN.
			
 
				+*----------------------------------------------------------------------------*)
			
 
				+const float32_default_nan = $7FFFFFFF;
			
 
				+
			
 
				+(*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the single-precision floating-point value `a' is a NaN;
			
 
				+| otherwise returns 0.
			
 
				+*----------------------------------------------------------------------------*)
			
 
				+function float32_is_nan(a:  float32): flag;
			
 
				+begin
			
 
				+    float32_is_nan := flag( 0xFF000000 < (bits32) ( a shl 1 ) );
			
 
				+end;
			
 
				+
			
 
				+(*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the single-precision floating-point value `a' is a signaling
			
 
				+| NaN; otherwise returns 0.
			
 
				+*----------------------------------------------------------------------------*)
			
 
				+function float32_is_signaling_nan(a: float32):flag;
			
 
				+ begin
			
 
				+   float32_is_signaling_nan := flag( ( ( a shr 22 ) and $1FF ) = $1FE ) and ( (a and $003FFFFF)<>0 );
			
 
				+ end;
			
 
				+ 
			
 
				+(*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the single-precision floating-point NaN
			
 
				+| `a' to the canonical NaN format.  If `a' is a signaling NaN, the invalid
			
 
				+| exception is raised.
			
 
				+*----------------------------------------------------------------------------*)
			
 
				+Procedure float32ToCommonNaN( a: float32; VAR c:commonNaNT  );
			
 
				+ var 
			
 
				+  z: commonNANT;
			
 
				+ begin
			
 
				+   if float32_is_signaling_nan(a) then
			
 
				+      float_raise(float_flag_invalid);
			
 
				+   z.sign := a shr 31;
			
 
				+   z.low := 0;
			
 
				+   z.high := a shl 9;
			
 
				+   c:=z;
			
 
				+ end;
			
 
				+
			
 
				+(*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the canonical NaN `a' to the single-
			
 
				+| precision floating-point format.
			
 
				+*----------------------------------------------------------------------------*)
			
 
				+function CommonNanToFloat32(a : CommonNaNT): float32;
			
 
				+ begin
			
 
				+    CommonNanToFloat32:= ( ( (bits32) a.sign ) shl 31 ) OR $7FC00000 OR ( a.high shr 9 );
			
 
				+ end;
			
 
				+ 
			
 
				+(*----------------------------------------------------------------------------
			
 
				+| Takes two single-precision floating-point values `a' and `b', one of which
			
 
				+| is a NaN, and returns the appropriate NaN result.  If either `a' or `b' is a
			
 
				+| signaling NaN, the invalid exception is raised.
			
 
				+*----------------------------------------------------------------------------*)
			
 
				+function  propagateFloat32NaN( a: float32 ; b: float32): float32;
			
 
				+ var
			
 
				+  aIsNaN, aIsSignalingNaN, bIsNaN, bIsSignalingNaN: flag;
			
 
				+ begin
			
 
				+    aIsNaN := float32_is_nan( a );
			
 
				+    aIsSignalingNaN := float32_is_signaling_nan( a );
			
 
				+    bIsNaN := float32_is_nan( b );
			
 
				+    bIsSignalingNaN := float32_is_signaling_nan( b );
			
 
				+    a := a or $00400000;
			
 
				+    b := b or $00400000;
			
 
				+    if ( aIsSignalingNaN or bIsSignalingNaN ) then
			
 
				+       float_raise( float_flag_invalid );
			
 
				+    if bIsSignalingNaN<>0 then
			
 
				+        propagateFloat32Nan := b
			
 
				+    else if aIsSignalingNan<>0 then
			
 
				+        propagateFloat32Nan := a
			
 
				+    else if bIsNan<>0 then
			
 
				+        propagateFloat32Nan := b
			
 
				+    else
			
 
				+        propagateFloat32Nan := a;
			
 
				+ end;
			
 
				+
			
 
				+
			
 
				+(*----------------------------------------------------------------------------
			
 
				+| The pattern for a default generated double-precision NaN.  The `high' and
			
 
				+| `low' values hold the most- and least-significant bits, respectively.
			
 
				+*----------------------------------------------------------------------------*)
			
 
				+const
			
 
				+    float64_default_nan_high = $7FFFFFFF;
			
 
				+    float64_default_nan_low  = $FFFFFFFF;
			
 
				+
			
 
				+(*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the double-precision floating-point value `a' is a NaN;
			
 
				+| otherwise returns 0.
			
 
				+*----------------------------------------------------------------------------*)
			
 
				+
			
 
				+function float64_is_nan(a: float64): flag;
			
 
				+ begin
			
 
				+    float_64_is_nan := flag
			
 
				+           ( $FFE00000 <= (bits32) ( a.high shl 1 ) )
			
 
				+        and ( (a.low<>0) or (( a.high and $000FFFFF )<>0) );
			
 
				+ end;
			
 
				+
			
 
				+(*----------------------------------------------------------------------------
			
 
				+| Returns 1 if the double-precision floating-point value `a' is a signaling
			
 
				+| NaN; otherwise returns 0.
			
 
				+*----------------------------------------------------------------------------*)
			
 
				+function float64_is_signaling_nan( a:float64): flag;
			
 
				+ begin
			
 
				+    float64_is_signaling_nan := flag
			
 
				+           ( ( ( a.high shr 19 ) and $FFF ) = $FFE )
			
 
				+        and ( (a.low<>0) or (( a.high and 0x0007FFFF )<>0) );
			
 
				+
			
 
				+ end;
			
 
				+
			
 
				+(*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the double-precision floating-point NaN
			
 
				+| `a' to the canonical NaN format.  If `a' is a signaling NaN, the invalid
			
 
				+| exception is raised.
			
 
				+*----------------------------------------------------------------------------*)
			
 
				+Procedure float64ToCommonNaN( a : float64; VAR c:commonNaNT );
			
 
				+ var
			
 
				+   z : commonNaNT;
			
 
				+ begin
			
 
				+    if ( float64_is_signaling_nan( a )<>0 ) then
			
 
				+        float_raise( float_flag_invalid );
			
 
				+    z.sign = a.high shr 31;
			
 
				+    shortShift64Left( a.high, a.low, 12, z.high, z.low );
			
 
				+    c:=z;
			
 
				+ end;
			
 
				+
			
 
				+(*----------------------------------------------------------------------------
			
 
				+| Returns the result of converting the canonical NaN `a' to the double-
			
 
				+| precision floating-point format.
			
 
				+*----------------------------------------------------------------------------*)
			
 
				+Procedure commonNaNToFloat64( a : commonNaNT; VAR c: float64  );
			
 
				+ var
			
 
				+  z: float64;
			
 
				+ begin
			
 
				+    shift64Right( a.high, a.low, 12, z.high, z.low );
			
 
				+    z.high := z.high or ( ( (bits32) a.sign )<<31 ) | 0x7FF80000;
			
 
				+    c:=z;
			
 
				+ end;
			
 
				+ 
			
 
				+(*----------------------------------------------------------------------------
			
 
				+| Takes two double-precision floating-point values `a' and `b', one of which
			
 
				+| is a NaN, and returns the appropriate NaN result.  If either `a' or `b' is a
			
 
				+| signaling NaN, the invalid exception is raised.
			
 
				+*----------------------------------------------------------------------------*)
			
 
				+Procedure propagateFloat64NaN( a: float64; b: float64 ; VAR c: float64 );
			
 
				+var
			
 
				+ aIsNaN, aIsSignalingNaN, bIsNaN, bIsSignalingNaN : flag;
			
 
				+ begin
			
 
				+    aIsNaN := float64_is_nan( a );
			
 
				+    aIsSignalingNaN := float64_is_signaling_nan( a );
			
 
				+    bIsNaN := float64_is_nan( b );
			
 
				+    bIsSignalingNaN := float64_is_signaling_nan( b );
			
 
				+    a.high := a.high or $00080000;
			
 
				+    b.high := b.high or $00080000;
			
 
				+    if ( aIsSignalingNaN<>0 or bIsSignalingNaN<>0 ) then
			
 
				+       float_raise( float_flag_invalid );
			
 
				+    if bIsSignalingNaN<>0 then
			
 
				+        c := b
			
 
				+    else if aIsSignalingNan<>0 then
			
 
				+        c := a
			
 
				+    else if bIsNan<>0 then
			
 
				+        c := b
			
 
				+    else
			
 
				+        c := a;
			
 
				+ end;
			
 
				+
			
 
				+{$ENDIF} 
			
 
				+
			
 
				+(****************************************************************************)
			
 
				+(*                        END ENDIAN SPECIFIC CODE                          *)
			
 
				+(****************************************************************************)
			
 
				+
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the fraction bits of the single-precision floating-point value `a'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function ExtractFloat32Frac(a : Float32) : Bits32;
			
 
				+ Begin
			
 
				+    ExtractFloat32Frac := A AND $007FFFFF;
			
 
				+ End;
			
 
				+
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the exponent bits of the single-precision floating-point value `a'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function extractFloat32Exp( a: float32 ): Int16;
			
 
				+  Begin
			
 
				+    extractFloat32Exp := (a shr 23) AND $FF;
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the sign bit of the single-precision floating-point value `a'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function extractFloat32Sign( a: float32 ): Flag;
			
 
				+  Begin
			
 
				+    extractFloat32Sign := a shr 31;
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Normalizes the subnormal single-precision floating-point value represented
			
 
				+by the denormalized significand `aSig'.  The normalized exponent and
			
 
				+significand are stored at the locations pointed to by `zExpPtr' and
			
 
				+`zSigPtr', respectively.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure normalizeFloat32Subnormal( aSig : bits32; VAR zExpPtr: Int16; VAR zSigPtr :bits32);
			
 
				+ Var
			
 
				+   ShiftCount : BYTE;
			
 
				+ Begin
			
 
				+
			
 
				+    shiftCount := countLeadingZeros32( aSig ) - 8;
			
 
				+    zSigPtr := aSig shl shiftCount;
			
 
				+    zExpPtr := 1 - shiftCount;
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Packs the sign `zSign', exponent `zExp', and significand `zSig' into a
			
 
				+single-precision floating-point value, returning the result.  After being
			
 
				+shifted into the proper positions, the three fields are simply added
			
 
				+together to form the result.  This means that any integer portion of `zSig'
			
 
				+will be added into the exponent.  Since a properly normalized significand
			
 
				+will have an integer portion equal to 1, the `zExp' input should be 1 less
			
 
				+than the desired result exponent whenever `zSig' is a complete, normalized
			
 
				+significand.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function packFloat32( zSign: Flag; zExp : Int16; zSig: Bits32 ): Float32;
			
 
				+ Begin
			
 
				+
			
 
				+    packFloat32 := ( ( bits32( zSign) ) shl 31 ) + ( ( bits32 (zExp) ) shl 23 )
			
 
				+      + zSig;
			
 
				+ End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Takes an abstract floating-point value having sign `zSign', exponent `zExp',
			
 
				+and significand `zSig', and returns the proper single-precision floating-
			
 
				+point value corresponding to the abstract input.  Ordinarily, the abstract
			
 
				+value is simply rounded and packed into the single-precision format, with
			
 
				+the inexact exception raised if the abstract input cannot be represented
			
 
				+exactly.  However, if the abstract value is too large, the overflow and
			
 
				+inexact exceptions are raised and an infinity or maximal finite value is
			
 
				+returned.  If the abstract value is too small, the input value is rounded to
			
 
				+a subnormal number, and the underflow and inexact exceptions are raised if
			
 
				+the abstract input cannot be represented exactly as a subnormal single-
			
 
				+precision floating-point number.
			
 
				+    The input significand `zSig' has its binary point between bits 30
			
 
				+and 29, which is 7 bits to the left of the usual location.  This shifted
			
 
				+significand must be normalized or smaller.  If `zSig' is not normalized,
			
 
				+`zExp' must be 0; in that case, the result returned is a subnormal number,
			
 
				+and it must not require rounding.  In the usual case that `zSig' is
			
 
				+normalized, `zExp' must be 1 less than the ``true'' floating-point exponent.
			
 
				+The handling of underflow and overflow follows the IEC/IEEE Standard for
			
 
				+Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function roundAndPackFloat32( zSign : Flag; zExp : Int16; zSig : Bits32 ) : float32;
			
 
				+ Var
			
 
				+   roundingMode : BYTE;
			
 
				+   roundNearestEven : Flag;
			
 
				+   roundIncrement, roundBits : BYTE;
			
 
				+   IsTiny : Flag;
			
 
				+ Begin
			
 
				+    roundingMode := float_rounding_mode;
			
 
				+    if (roundingMode = float_round_nearest_even) then
			
 
				+      Begin
			
 
				+        roundNearestEven := Flag(TRUE);
			
 
				+      end
			
 
				+    else
			
 
				+       roundNearestEven := Flag(FALSE);
			
 
				+    roundIncrement := $40;
			
 
				+    if ( Boolean(roundNearestEven)  = FALSE)  then
			
 
				+      Begin
			
 
				+        if ( roundingMode = float_round_to_zero ) Then
			
 
				+          Begin
			
 
				+            roundIncrement := 0;
			
 
				+          End
			
 
				+        else
			
 
				+          Begin
			
 
				+            roundIncrement := $7F;
			
 
				+            if ( zSign <> 0 ) then
			
 
				+              Begin
			
 
				+                if roundingMode = float_round_up then roundIncrement := 0;
			
 
				+              End
			
 
				+            else
			
 
				+              Begin
			
 
				+                if roundingMode = float_round_down then roundIncrement := 0;
			
 
				+              End;
			
 
				+         End
			
 
				+      End;
			
 
				+    roundBits := zSig AND $7F;
			
 
				+    if ($FD <= bits16 (zExp) ) then
			
 
				+     Begin
			
 
				+        if (( $FD < zExp ) OR  ( zExp = $FD ) AND ( sbits32 ( zSig + roundIncrement ) < 0 ) ) then
			
 
				+          Begin
			
 
				+             float_raise( float_flag_overflow OR float_flag_inexact );
			
 
				+             roundAndPackFloat32:=packFloat32( zSign, $FF, 0 ) - Flag( roundIncrement = 0 );
			
 
				+             exit;
			
 
				+          End;
			
 
				+        if ( zExp < 0 ) then
			
 
				+          Begin
			
 
				+            isTiny :=
			
 
				+                   flag(( float_detect_tininess = float_tininess_before_rounding )
			
 
				+                OR ( zExp < -1 )
			
 
				+                OR ( (zSig + roundIncrement) < $80000000 ));
			
 
				+            shift32RightJamming( zSig, - zExp, zSig );
			
 
				+            zExp := 0;
			
 
				+            roundBits := zSig AND $7F;
			
 
				+            if ( (isTiny = flag(TRUE)) and (roundBits<>0) ) then
			
 
				+               float_raise( float_flag_underflow );
			
 
				+          End;
			
 
				+    End;
			
 
				+    if ( roundBits )<> 0 then
			
 
				+       float_exception_flags := float_flag_inexact OR float_exception_flags;
			
 
				+    zSig := ( zSig + roundIncrement ) shr 7;
			
 
				+    zSig := zSig AND not bits32( bits32( ( roundBits XOR $40 ) = 0 ) and roundNearestEven );
			
 
				+    if ( zSig = 0 ) then zExp := 0;
			
 
				+    roundAndPackFloat32 := packFloat32( zSign, zExp, zSig );
			
 
				+    exit;
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Takes an abstract floating-point value having sign `zSign', exponent `zExp',
			
 
				+and significand `zSig', and returns the proper single-precision floating-
			
 
				+point value corresponding to the abstract input.  This routine is just like
			
 
				+`roundAndPackFloat32' except that `zSig' does not have to be normalized.
			
 
				+Bit 31 of `zSig' must be zero, and `zExp' must be 1 less than the ``true''
			
 
				+floating-point exponent.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function normalizeRoundAndPackFloat32( zSign: flag; zExp: int16; zSig:bits32 ): float32;
			
 
				+  Var
			
 
				+    ShiftCount : int8;
			
 
				+  Begin
			
 
				+    shiftCount := countLeadingZeros32( zSig ) - 1;
			
 
				+    normalizeRoundAndPackFloat32 := roundAndPackFloat32( zSign, zExp - shiftCount, zSig shl shiftCount );
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the least-significant 32 fraction bits of the double-precision
			
 
				+floating-point value `a'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function extractFloat64Frac( a: float64 ): bits32;
			
 
				+  Begin
			
 
				+    extractFloat64Frac := a.low;
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the most-significant 20 fraction bits of the double-precision
			
 
				+floating-point value `a'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function extractFloat64Frac0(a: float64): bits32;
			
 
				+  Begin
			
 
				+    extractFloat64Frac0 := a.high and $000FFFFF;
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the least-significant 32 fraction bits of the double-precision
			
 
				+floating-point value `a'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function extractFloat64Frac1(a: float64): bits32;
			
 
				+  Begin
			
 
				+    extractFloat64Frac1 := a.low;
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the exponent bits of the double-precision floating-point value `a'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function extractFloat64Exp(a: float64): int16;
			
 
				+ Begin
			
 
				+    extractFloat64Exp:= ( a.high shr 20 ) AND $7FF;
			
 
				+ End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the sign bit of the double-precision floating-point value `a'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function extractFloat64Sign(a: float64) : flag;
			
 
				+ Begin
			
 
				+    extractFloat64Sign := a.high shr 31;
			
 
				+ End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Normalizes the subnormal double-precision floating-point value represented
			
 
				+by the denormalized significand formed by the concatenation of `aSig0' and
			
 
				+`aSig1'.  The normalized exponent is stored at the location pointed to by
			
 
				+`zExpPtr'.  The most significant 21 bits of the normalized significand are
			
 
				+stored at the location pointed to by `zSig0Ptr', and the least significant
			
 
				+32 bits of the normalized significand are stored at the location pointed to
			
 
				+by `zSig1Ptr'.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure normalizeFloat64Subnormal(
			
 
				+     aSig0: bits32;
			
 
				+     aSig1: bits32;
			
 
				+     VAR zExpPtr : Int16;
			
 
				+     VAR zSig0Ptr : Bits32;
			
 
				+     VAR zSig1Ptr : Bits32
			
 
				+ );
			
 
				+ Var
			
 
				+  ShiftCount : Int8;
			
 
				+ Begin
			
 
				+    if ( aSig0 = 0 ) then
			
 
				+      Begin
			
 
				+        shiftCount := countLeadingZeros32( aSig1 ) - 11;
			
 
				+        if ( shiftCount < 0 ) then
			
 
				+          Begin
			
 
				+            zSig0Ptr := aSig1 shr ( - shiftCount );
			
 
				+            zSig1Ptr := aSig1 shl ( shiftCount AND 31 );
			
 
				+          End
			
 
				+        else
			
 
				+           Begin
			
 
				+            zSig0Ptr := aSig1 shl shiftCount;
			
 
				+            zSig1Ptr := 0;
			
 
				+           End;
			
 
				+        zExpPtr := - shiftCount - 31;
			
 
				+      End
			
 
				+    else
			
 
				+      Begin
			
 
				+        shiftCount := countLeadingZeros32( aSig0 ) - 11;
			
 
				+        shortShift64Left( aSig0, aSig1, shiftCount, zSig0Ptr, zSig1Ptr );
			
 
				+        zExpPtr := 1 - shiftCount;
			
 
				+      End;
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Packs the sign `zSign', the exponent `zExp', and the significand formed by
			
 
				+the concatenation of `zSig0' and `zSig1' into a double-precision floating-
			
 
				+point value, returning the result.  After being shifted into the proper
			
 
				+positions, the three fields `zSign', `zExp', and `zSig0' are simply added
			
 
				+together to form the most significant 32 bits of the result.  This means
			
 
				+that any integer portion of `zSig0' will be added into the exponent.  Since
			
 
				+a properly normalized significand will have an integer portion equal to 1,
			
 
				+the `zExp' input should be 1 less than the desired result exponent whenever
			
 
				+`zSig0' and `zSig1' concatenated form a complete, normalized significand.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure
			
 
				+ packFloat64( zSign: Flag; zExp: Int16; zSig0: Bits32; zSig1 : Bits32; VAR c : float64);
			
 
				+ var
			
 
				+    z: Float64;
			
 
				+ Begin
			
 
				+
			
 
				+    z.low := zSig1;
			
 
				+    z.high := ( ( bits32 (zSign) ) shl 31 ) + ( ( bits32 (zExp) ) shl 20 ) + zSig0;
			
 
				+    c := z;
			
 
				+ End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Takes an abstract floating-point value having sign `zSign', exponent `zExp',
			
 
				+and extended significand formed by the concatenation of `zSig0', `zSig1',
			
 
				+and `zSig2', and returns the proper double-precision floating-point value
			
 
				+corresponding to the abstract input.  Ordinarily, the abstract value is
			
 
				+simply rounded and packed into the double-precision format, with the inexact
			
 
				+exception raised if the abstract input cannot be represented exactly.
			
 
				+However, if the abstract value is too large, the overflow and inexact
			
 
				+exceptions are raised and an infinity or maximal finite value is returned.
			
 
				+If the abstract value is too small, the input value is rounded to a
			
 
				+subnormal number, and the underflow and inexact exceptions are raised if the
			
 
				+abstract input cannot be represented exactly as a subnormal double-precision
			
 
				+floating-point number.
			
 
				+    The input significand must be normalized or smaller.  If the input
			
 
				+significand is not normalized, `zExp' must be 0; in that case, the result
			
 
				+returned is a subnormal number, and it must not require rounding.  In the
			
 
				+usual case that the input significand is normalized, `zExp' must be 1 less
			
 
				+than the ``true'' floating-point exponent.  The handling of underflow and
			
 
				+overflow follows the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure
			
 
				+ roundAndPackFloat64(
			
 
				+     zSign: Flag; zExp: Int16; zSig0: Bits32; zSig1: Bits32; zSig2: Bits32; Var c: Float64 );
			
 
				+ Var
			
 
				+   roundingMode : Int8;
			
 
				+   roundNearestEven, increment, isTiny : Flag;
			
 
				+ Begin
			
 
				+
			
 
				+    roundingMode := float_rounding_mode;
			
 
				+    roundNearestEven := flag( roundingMode = float_round_nearest_even );
			
 
				+    increment := flag( sbits32 (zSig2) < 0 );
			
 
				+    if ( roundNearestEven  = flag(FALSE) ) then
			
 
				+      Begin
			
 
				+        if ( roundingMode = float_round_to_zero ) then
			
 
				+            increment := 0
			
 
				+        else
			
 
				+          Begin
			
 
				+            if ( zSign )<> 0 then
			
 
				+              Begin
			
 
				+                increment := flag( roundingMode = float_round_down ) and zSig2;
			
 
				+              End
			
 
				+            else
			
 
				+              Begin
			
 
				+                increment := flag( roundingMode = float_round_up ) and zSig2;
			
 
				+              End
			
 
				+          End
			
 
				+      End;
			
 
				+    if ( $7FD <= bits16 (zExp) ) then
			
 
				+      Begin
			
 
				+        if (( $7FD < zExp )
			
 
				+             or (( zExp = $7FD )
			
 
				+                  and (eq64( $001FFFFF, $FFFFFFFF, zSig0, zSig1 )<>0)
			
 
				+                  and (increment<>0)
			
 
				+                )
			
 
				+           ) then
			
 
				+           Begin
			
 
				+            float_raise( float_flag_overflow OR  float_flag_inexact );
			
 
				+            if (( roundingMode = float_round_to_zero )
			
 
				+                 or ( (zSign<>0) and ( roundingMode = float_round_up ) )
			
 
				+                 or ( (zSign = 0) and ( roundingMode = float_round_down ) )
			
 
				+               ) then
			
 
				+              Begin
			
 
				+                packFloat64( zSign, $7FE, $000FFFFF, $FFFFFFFF, c );
			
 
				+                exit;
			
 
				+              End;
			
 
				+            packFloat64( zSign, $7FF, 0, 0, c );
			
 
				+            exit;
			
 
				+           End;
			
 
				+        if ( zExp < 0 ) then
			
 
				+           Begin
			
 
				+            isTiny :=
			
 
				+                   flag( float_detect_tininess = float_tininess_before_rounding )
			
 
				+                or flag( zExp < -1 )
			
 
				+                or  flag(increment = 0)
			
 
				+                or flag(lt64( zSig0, zSig1, $001FFFFF, $FFFFFFFF)<>0);
			
 
				+            shift64ExtraRightJamming(
			
 
				+                zSig0, zSig1, zSig2, - zExp, zSig0, zSig1, zSig2 );
			
 
				+            zExp := 0;
			
 
				+            if ( isTiny<>0) and (zSig2<>0 ) then float_raise( float_flag_underflow );
			
 
				+            if ( roundNearestEven )<>0 then
			
 
				+              Begin
			
 
				+                increment := flag( sbits32 (zSig2) < 0 );
			
 
				+              End
			
 
				+            else
			
 
				+              Begin
			
 
				+                if ( zSign )<>0 then
			
 
				+                  Begin
			
 
				+                    increment := flag( roundingMode = float_round_down ) and zSig2;
			
 
				+                  End
			
 
				+                else
			
 
				+                  Begin
			
 
				+                    increment := flag( roundingMode = float_round_up ) and zSig2;
			
 
				+                  End
			
 
				+              End;
			
 
				+        End;
			
 
				+    End;
			
 
				+    if ( zSig2 )<>0 then
			
 
				+       float_exception_flags := float_exception_flags OR  float_flag_inexact;
			
 
				+    if ( increment )<>0 then
			
 
				+      Begin
			
 
				+        add64( zSig0, zSig1, 0, 1, zSig0, zSig1 );
			
 
				+        {!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!}
			
 
				+        zSig1 := zSig1 and not ( flag( zSig2 + zSig2 = 0 ) and roundNearestEven );
			
 
				+      End
			
 
				+    else
			
 
				+      Begin
			
 
				+        if ( ( zSig0 or zSig1 ) = 0 ) then zExp := 0;
			
 
				+      End;
			
 
				+    packFloat64( zSign, zExp, zSig0, zSig1, c );
			
 
				+ End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Takes an abstract floating-point value having sign `zSign', exponent `zExp',
			
 
				+and significand formed by the concatenation of `zSig0' and `zSig1', and
			
 
				+returns the proper double-precision floating-point value corresponding
			
 
				+to the abstract input.  This routine is just like `roundAndPackFloat64'
			
 
				+except that the input significand has fewer bits and does not have to be
			
 
				+normalized.  In all cases, `zExp' must be 1 less than the ``true'' floating-
			
 
				+point exponent.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure
			
 
				+ normalizeRoundAndPackFloat64(
			
 
				+     zSign:flag; zExp:int16; zSig0:bits32; zSig1:bits32; VAR c: float64 );
			
 
				+ Var
			
 
				+   shiftCount : int8;
			
 
				+   zSig2 : bits32;
			
 
				+ Begin
			
 
				+
			
 
				+    if ( zSig0 = 0 ) then
			
 
				+     Begin
			
 
				+        zSig0 := zSig1;
			
 
				+        zSig1 := 0;
			
 
				+        zExp := zExp -32;
			
 
				+     End;
			
 
				+    shiftCount := countLeadingZeros32( zSig0 ) - 11;
			
 
				+    if ( 0 <= shiftCount ) then
			
 
				+      Begin
			
 
				+        zSig2 := 0;
			
 
				+        shortShift64Left( zSig0, zSig1, shiftCount, zSig0, zSig1 );
			
 
				+      End
			
 
				+    else
			
 
				+      Begin
			
 
				+        shift64ExtraRightJamming
			
 
				+          (zSig0, zSig1, 0, - shiftCount, zSig0, zSig1, zSig2 );
			
 
				+      End;
			
 
				+    zExp := zExp - shiftCount;
			
 
				+    roundAndPackFloat64( zSign, zExp, zSig0, zSig1, zSig2, c );
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the 32-bit two's complement integer `a' to
			
 
				+the single-precision floating-point format.  The conversion is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function int32_to_float32( a: int32): float32;
			
 
				+ Var
			
 
				+  zSign : Flag;
			
 
				+ Begin
			
 
				+
			
 
				+    if ( a = 0 ) then
			
 
				+      Begin
			
 
				+       int32_to_float32 := 0;
			
 
				+       exit;
			
 
				+      End;
			
 
				+    if ( a = sbits32 ($80000000) ) then
			
 
				+      Begin
			
 
				+       int32_to_float32 := packFloat32( 1, $9E, 0 );
			
 
				+       exit;
			
 
				+      end;
			
 
				+    zSign := flag( a < 0 );
			
 
				+    If zSign<>0 then
			
 
				+      a := -a;
			
 
				+    int32_to_float32:=
			
 
				+      normalizeRoundAndPackFloat32( zSign, $9C, a );
			
 
				+ End;
			
 
				+
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the 32-bit two's complement integer `a' to
			
 
				+the double-precision floating-point format.  The conversion is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure int32_to_float64( a: int32; var c: float64 );
			
 
				+  var
			
 
				+    zSign : flag;
			
 
				+    absA : bits32;
			
 
				+    shiftCount : int8;
			
 
				+    zSig0, zSig1 : bits32;
			
 
				+  Begin
			
 
				+
			
 
				+    if ( a = 0 ) then
			
 
				+      Begin
			
 
				+       packFloat64( 0, 0, 0, 0, c );
			
 
				+       exit;
			
 
				+      end;
			
 
				+    zSign := flag( a < 0 );
			
 
				+    if ZSign<>0 then
			
 
				+      AbsA := -a
			
 
				+    else
			
 
				+      AbsA := a;
			
 
				+    shiftCount := countLeadingZeros32( absA ) - 11;
			
 
				+    if ( 0 <= shiftCount ) then
			
 
				+      Begin
			
 
				+        zSig0 := absA shl shiftCount;
			
 
				+        zSig1 := 0;
			
 
				+      End
			
 
				+    else
			
 
				+      Begin
			
 
				+        shift64Right( absA, 0, - shiftCount, zSig0, zSig1 );
			
 
				+      End;
			
 
				+    packFloat64( zSign, $412 - shiftCount, zSig0, zSig1,c );
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the single-precision floating-point value
			
 
				+`a' to the 32-bit two's complement integer format.  The conversion is
			
 
				+performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic---which means in particular that the conversion is rounded
			
 
				+according to the current rounding mode.  If `a' is a NaN, the largest
			
 
				+positive integer is returned.  Otherwise, if the conversion overflows, the
			
 
				+largest integer with the same sign as `a' is returned.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_to_int32( a : float32) : int32;
			
 
				+  Var
			
 
				+    aSign: flag;
			
 
				+    aExp, shiftCount: int16;
			
 
				+    aSig, aSigExtra: bits32;
			
 
				+    z: int32;
			
 
				+    roundingMode: int8;
			
 
				+  Begin
			
 
				+
			
 
				+    aSig := extractFloat32Frac( a );
			
 
				+    aExp := extractFloat32Exp( a );
			
 
				+    aSign := extractFloat32Sign( a );
			
 
				+    shiftCount := aExp - $96;
			
 
				+    if ( 0 <= shiftCount ) then
			
 
				+      Begin
			
 
				+        if ( $9E <= aExp ) then
			
 
				+          Begin
			
 
				+            if ( a <> $CF000000 ) then
			
 
				+              Begin
			
 
				+                float_raise( float_flag_invalid );
			
 
				+                if ( (aSign=0) or ( ( aExp = $FF ) and (aSig<>0) ) ) then
			
 
				+                  Begin
			
 
				+                    float32_to_int32 := $7FFFFFFF;
			
 
				+                    exit;
			
 
				+                  End;
			
 
				+              End;
			
 
				+            float32_to_int32 := sbits32 ($80000000);
			
 
				+            exit;
			
 
				+          End;
			
 
				+        z := ( aSig or $00800000 ) shl shiftCount;
			
 
				+        if ( aSign<>0 ) then z := - z;
			
 
				+      End
			
 
				+    else
			
 
				+      Begin
			
 
				+        if ( aExp < $7E ) then
			
 
				+          Begin
			
 
				+            aSigExtra := aExp OR aSig;
			
 
				+            z := 0;
			
 
				+          End
			
 
				+        else
			
 
				+         Begin
			
 
				+            aSig := aSig OR $00800000;
			
 
				+            aSigExtra := aSig shl ( shiftCount and 31 );
			
 
				+            z := aSig shr ( - shiftCount );
			
 
				+         End;
			
 
				+        if ( aSigExtra<>0 ) then
			
 
				+          float_exception_flags := float_exception_flags
			
 
				+             or float_flag_inexact;
			
 
				+        roundingMode := float_rounding_mode;
			
 
				+        if ( roundingMode = float_round_nearest_even ) then
			
 
				+          Begin
			
 
				+            if ( sbits32 (aSigExtra) < 0 ) then
			
 
				+              Begin
			
 
				+                Inc(z);
			
 
				+                if ( bits32 ( aSigExtra shl 1 ) = 0 ) then
			
 
				+                  z := z and not 1;
			
 
				+              End;
			
 
				+              if ( aSign<>0 ) then
			
 
				+                z := - z;
			
 
				+          End
			
 
				+        else
			
 
				+          Begin
			
 
				+            aSigExtra := flag( aSigExtra <> 0 );
			
 
				+            if ( aSign<>0 ) then
			
 
				+             Begin
			
 
				+                z := z + (flag( roundingMode = float_round_down ) and aSigExtra);
			
 
				+                z := - z;
			
 
				+             End
			
 
				+            else
			
 
				+             Begin
			
 
				+                z := z + (flag( roundingMode = float_round_up ) and aSigExtra);
			
 
				+             End
			
 
				+          End;
			
 
				+      End;
			
 
				+   float32_to_int32 := z;
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the single-precision floating-point value
			
 
				+`a' to the 32-bit two's complement integer format.  The conversion is
			
 
				+performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic, except that the conversion is always rounded toward zero.
			
 
				+If `a' is a NaN, the largest positive integer is returned.  Otherwise, if
			
 
				+the conversion overflows, the largest integer with the same sign as `a' is
			
 
				+returned.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_to_int32_round_to_zero( a: Float32 ): int32;
			
 
				+ Var
			
 
				+    aSign : flag;
			
 
				+    aExp, shiftCount : int16;
			
 
				+    aSig : bits32;
			
 
				+    z : int32;
			
 
				+ Begin
			
 
				+    aSig := extractFloat32Frac( a );
			
 
				+    aExp := extractFloat32Exp( a );
			
 
				+    aSign := extractFloat32Sign( a );
			
 
				+    shiftCount := aExp - $9E;
			
 
				+    if ( 0 <= shiftCount ) then
			
 
				+      Begin
			
 
				+        if ( a <> $CF000000 ) then
			
 
				+          Begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            if ( (aSign=0) or ( ( aExp = $FF ) and (aSig<>0) ) ) then
			
 
				+              Begin
			
 
				+                float32_to_int32_round_to_zero := $7FFFFFFF;
			
 
				+                exit;
			
 
				+              end;
			
 
				+          End;
			
 
				+        float32_to_int32_round_to_zero:= sbits32 ($80000000);
			
 
				+        exit;
			
 
				+      End
			
 
				+    else
			
 
				+      if ( aExp <= $7E ) then
			
 
				+      Begin
			
 
				+        if ( aExp or aSig )<>0 then
			
 
				+           float_exception_flags :=
			
 
				+             float_exception_flags or float_flag_inexact;
			
 
				+        float32_to_int32_round_to_zero := 0;
			
 
				+        exit;
			
 
				+      End;
			
 
				+    aSig := ( aSig or $00800000 ) shl 8;
			
 
				+    z := aSig shr ( - shiftCount );
			
 
				+    if ( bits32 ( aSig shl ( shiftCount and 31 ) )<> 0 ) then
			
 
				+      Begin
			
 
				+           float_exception_flags :=
			
 
				+             float_exception_flags or float_flag_inexact;
			
 
				+      End;
			
 
				+    if ( aSign<>0 ) then z := - z;
			
 
				+    float32_to_int32_round_to_zero := z;
			
 
				+ End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the single-precision floating-point value
			
 
				+`a' to the double-precision floating-point format.  The conversion is
			
 
				+performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float32_to_float64( a : float32; var out: Float64);
			
 
				+  Var
			
 
				+    aSign : flag;
			
 
				+    aExp : int16;
			
 
				+    aSig, zSig0, zSig1: bits32;
			
 
				+    tmp : CommonNanT;
			
 
				+  Begin
			
 
				+    aSig := extractFloat32Frac( a );
			
 
				+    aExp := extractFloat32Exp( a );
			
 
				+    aSign := extractFloat32Sign( a );
			
 
				+    if ( aExp = $FF ) then
			
 
				+      Begin
			
 
				+        if ( aSig<>0 ) then
			
 
				+          Begin
			
 
				+            float32ToCommonNaN(a, tmp);
			
 
				+            commonNaNToFloat64(tmp , out);
			
 
				+            exit;
			
 
				+          End;
			
 
				+          packFloat64( aSign, $7FF, 0, 0, out );
			
 
				+          exit;
			
 
				+      End;
			
 
				+    if ( aExp = 0 ) then
			
 
				+      Begin
			
 
				+        if ( aSig = 0 ) then
			
 
				+          Begin
			
 
				+            packFloat64( aSign, 0, 0, 0, out );
			
 
				+            exit;
			
 
				+          end;
			
 
				+        normalizeFloat32Subnormal( aSig, aExp, aSig );
			
 
				+        Dec(aExp);
			
 
				+      End;
			
 
				+    shift64Right( aSig, 0, 3, zSig0, zSig1 );
			
 
				+    packFloat64( aSign, aExp + $380, zSig0, zSig1, out );
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Rounds the single-precision floating-point value `a' to an integer,
			
 
				+and returns the result as a single-precision floating-point value.  The
			
 
				+operation is performed according to the IEC/IEEE Standard for Binary
			
 
				+Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_round_to_int( a: float32): float32;
			
 
				+  Var
			
 
				+    aSign: flag;
			
 
				+    aExp: int16;
			
 
				+    lastBitMask, roundBitsMask: bits32;
			
 
				+    roundingMode: int8;
			
 
				+    z: float32;
			
 
				+  Begin
			
 
				+    aExp := extractFloat32Exp( a );
			
 
				+    if ( $96 <= aExp ) then
			
 
				+     Begin
			
 
				+        if ( ( aExp = $FF ) and (extractFloat32Frac( a )<>0) ) then
			
 
				+          Begin
			
 
				+            float32_round_to_int:= propagateFloat32NaN( a, a );
			
 
				+            exit;
			
 
				+          End;
			
 
				+        float32_round_to_int:=a;
			
 
				+        exit;
			
 
				+     End;
			
 
				+    if ( aExp <= $7E ) then
			
 
				+      Begin
			
 
				+        if ( bits32 ( a shl 1 ) = 0 ) then
			
 
				+          Begin
			
 
				+             float32_round_to_int:=a;
			
 
				+             exit;
			
 
				+          end;
			
 
				+        float_exception_flags
			
 
				+          := float_exception_flags OR  float_flag_inexact;
			
 
				+        aSign := extractFloat32Sign( a );
			
 
				+
			
 
				+        case ( float_rounding_mode ) of
			
 
				+         float_round_nearest_even:
			
 
				+            Begin
			
 
				+              if ( ( aExp = $7E ) and (extractFloat32Frac( a )<>0) ) then
			
 
				+                Begin
			
 
				+                  float32_round_to_int := packFloat32( aSign, $7F, 0 );
			
 
				+                  exit;
			
 
				+                End;
			
 
				+            End;
			
 
				+         float_round_down:
			
 
				+            Begin
			
 
				+              if aSign <> 0 then
			
 
				+                 float32_round_to_int := $BF800000
			
 
				+              else
			
 
				+                 float32_round_to_int := 0;
			
 
				+              exit;
			
 
				+            End;
			
 
				+         float_round_up:
			
 
				+            Begin
			
 
				+              if aSign <> 0 then
			
 
				+                 float32_round_to_int := $80000000
			
 
				+              else
			
 
				+                 float32_round_to_int := $3F800000;
			
 
				+              exit;
			
 
				+            End;
			
 
				+        end;
			
 
				+        float32_round_to_int := packFloat32( aSign, 0, 0 );
			
 
				+      End;
			
 
				+    lastBitMask := 1;
			
 
				+    {_____________________________!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!}
			
 
				+    lastBitMask := lastBitMask shl ($96 - aExp);
			
 
				+    roundBitsMask := lastBitMask - 1;
			
 
				+    z := a;
			
 
				+    roundingMode := float_rounding_mode;
			
 
				+    if ( roundingMode = float_round_nearest_even ) then
			
 
				+      Begin
			
 
				+        z := z + (lastBitMask shr 1);
			
 
				+        if ( ( z and roundBitsMask ) = 0 ) then
			
 
				+           z := z and not lastBitMask;
			
 
				+      End
			
 
				+    else if ( roundingMode <> float_round_to_zero ) then
			
 
				+      Begin
			
 
				+        if ( (extractFloat32Sign( z ) xor flag(roundingMode = float_round_up ))<>0 ) then
			
 
				+          Begin
			
 
				+            z := z + roundBitsMask;
			
 
				+          End;
			
 
				+      End;
			
 
				+    z := z and not roundBitsMask;
			
 
				+    if ( z <> a ) then
			
 
				+      float_exception_flags := float_exception_flags or float_flag_inexact;
			
 
				+    float32_round_to_int := z;
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of adding the absolute values of the single-precision
			
 
				+floating-point values `a' and `b'.  If `zSign' is 1, the sum is negated
			
 
				+before being returned.  `zSign' is ignored if the result is a NaN.
			
 
				+The addition is performed according to the IEC/IEEE Standard for Binary
			
 
				+Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function addFloat32Sigs( a:float32; b: float32; zSign:flag ): float32;
			
 
				+  Var
			
 
				+    aExp, bExp, zExp: int16;
			
 
				+    aSig, bSig, zSig: bits32;
			
 
				+    expDiff: int16;
			
 
				+    label roundAndPack;
			
 
				+  Begin
			
 
				+    aSig:=extractFloat32Frac( a );
			
 
				+    aExp:=extractFloat32Exp( a );
			
 
				+    bSig:=extractFloat32Frac( b );
			
 
				+    bExp := extractFloat32Exp( b );
			
 
				+    expDiff := aExp - bExp;
			
 
				+    aSig := aSig shl 6;
			
 
				+    bSig := bSig shl 6;
			
 
				+    if ( 0 < expDiff ) then
			
 
				+    Begin
			
 
				+        if ( aExp = $FF ) then
			
 
				+          Begin
			
 
				+            if ( aSig <> 0) then
			
 
				+              Begin
			
 
				+                addFloat32Sigs := propagateFloat32NaN( a, b );
			
 
				+                exit;
			
 
				+              End;
			
 
				+            addFloat32Sigs := a;
			
 
				+            exit;
			
 
				+          End;
			
 
				+        if ( bExp = 0 ) then
			
 
				+          Begin
			
 
				+             Dec(expDiff);
			
 
				+          End
			
 
				+        else
			
 
				+          Begin
			
 
				+            bSig := bSig or $20000000;
			
 
				+          End;
			
 
				+        shift32RightJamming( bSig, expDiff, bSig );
			
 
				+        zExp := aExp;
			
 
				+    End
			
 
				+    else
			
 
				+    If ( expDiff < 0 ) then
			
 
				+      Begin
			
 
				+        if ( bExp = $FF ) then
			
 
				+        Begin
			
 
				+            if ( bSig<>0 ) then
			
 
				+              Begin
			
 
				+                addFloat32Sigs := propagateFloat32NaN( a, b );
			
 
				+                exit;
			
 
				+              end;
			
 
				+
			
 
				+            addFloat32Sigs := packFloat32( zSign, $FF, 0 );
			
 
				+            exit;
			
 
				+        End;
			
 
				+        if ( aExp = 0 ) then
			
 
				+          Begin
			
 
				+            Inc(expDiff);
			
 
				+          End
			
 
				+        else
			
 
				+          Begin
			
 
				+            aSig := aSig OR $20000000;
			
 
				+          End;
			
 
				+        shift32RightJamming( aSig, - expDiff, aSig );
			
 
				+        zExp := bExp;
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        if ( aExp = $FF ) then
			
 
				+        Begin
			
 
				+            if ( aSig OR  bSig )<> 0 then
			
 
				+              Begin
			
 
				+                addFloat32Sigs := propagateFloat32NaN( a, b );
			
 
				+                exit;
			
 
				+              end;
			
 
				+            addFloat32Sigs := a;
			
 
				+            exit;
			
 
				+        End;
			
 
				+        if ( aExp = 0 ) then
			
 
				+          Begin
			
 
				+             addFloat32Sigs := packFloat32( zSign, 0, ( aSig + bSig ) shr 6 );
			
 
				+             exit;
			
 
				+          end;
			
 
				+        zSig := $40000000 + aSig + bSig;
			
 
				+        zExp := aExp;
			
 
				+        goto roundAndPack;
			
 
				+    End;
			
 
				+    aSig := aSig OR $20000000;
			
 
				+    zSig := ( aSig + bSig ) shl 1;
			
 
				+    Dec(zExp);
			
 
				+    if ( sbits32 (zSig) < 0 ) then
			
 
				+      Begin
			
 
				+        zSig := aSig + bSig;
			
 
				+        Inc(zExp);
			
 
				+      End;
			
 
				+ roundAndPack:
			
 
				+    addFloat32Sigs := roundAndPackFloat32( zSign, zExp, zSig );
			
 
				+ End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of subtracting the absolute values of the single-
			
 
				+precision floating-point values `a' and `b'.  If `zSign' is 1, the
			
 
				+difference is negated before being returned.  `zSign' is ignored if the
			
 
				+result is a NaN.  The subtraction is performed according to the IEC/IEEE
			
 
				+Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function subFloat32Sigs( a:float32; b:float32; zSign:flag ): float32;
			
 
				+  Var
			
 
				+    aExp, bExp, zExp: int16;
			
 
				+    aSig, bSig, zSig: bits32;
			
 
				+    expDiff : int16;
			
 
				+    label aExpBigger;
			
 
				+    label bExpBigger;
			
 
				+    label aBigger;
			
 
				+    label bBigger;
			
 
				+    label normalizeRoundAndPack;
			
 
				+  Begin
			
 
				+    aSig := extractFloat32Frac( a );
			
 
				+    aExp := extractFloat32Exp( a );
			
 
				+    bSig := extractFloat32Frac( b );
			
 
				+    bExp := extractFloat32Exp( b );
			
 
				+    expDiff := aExp - bExp;
			
 
				+    aSig := aSig shl 7;
			
 
				+    bSig := bSig shl 7;
			
 
				+    if ( 0 < expDiff ) then goto aExpBigger;
			
 
				+    if ( expDiff < 0 ) then goto bExpBigger;
			
 
				+    if ( aExp = $FF ) then
			
 
				+    Begin
			
 
				+        if ( aSig OR  bSig )<> 0 then
			
 
				+          Begin
			
 
				+           subFloat32Sigs := propagateFloat32NaN( a, b );
			
 
				+           exit;
			
 
				+          End;
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        subFloat32Sigs := float32_default_nan;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( aExp = 0 ) then
			
 
				+    Begin
			
 
				+        aExp := 1;
			
 
				+        bExp := 1;
			
 
				+    End;
			
 
				+    if ( bSig < aSig ) Then goto aBigger;
			
 
				+    if ( aSig < bSig ) Then goto bBigger;
			
 
				+    subFloat32Sigs := packFloat32( flag(float_rounding_mode = float_round_down), 0, 0 );
			
 
				+    exit;
			
 
				+ bExpBigger:
			
 
				+    if ( bExp = $FF ) then
			
 
				+    Begin
			
 
				+        if ( bSig<>0 ) then
			
 
				+        Begin
			
 
				+          subFloat32Sigs := propagateFloat32NaN( a, b );
			
 
				+          exit;
			
 
				+        End;
			
 
				+        subFloat32Sigs := packFloat32( zSign XOR 1, $FF, 0 );
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( aExp = 0 ) then
			
 
				+      Begin
			
 
				+        Inc(expDiff);
			
 
				+      End
			
 
				+    else
			
 
				+      Begin
			
 
				+        aSig := aSig OR $40000000;
			
 
				+      End;
			
 
				+    shift32RightJamming( aSig, - expDiff, aSig );
			
 
				+    bSig := bSig OR $40000000;
			
 
				+ bBigger:
			
 
				+    zSig := bSig - aSig;
			
 
				+    zExp := bExp;
			
 
				+    zSign := zSign xor 1;
			
 
				+    goto normalizeRoundAndPack;
			
 
				+ aExpBigger:
			
 
				+    if ( aExp = $FF ) then
			
 
				+      Begin
			
 
				+        if ( aSig <> 0) then
			
 
				+          Begin
			
 
				+            subFloat32Sigs := propagateFloat32NaN( a, b );
			
 
				+            exit;
			
 
				+          End;
			
 
				+        subFloat32Sigs := a;
			
 
				+        exit;
			
 
				+      End;
			
 
				+    if ( bExp = 0 ) then
			
 
				+      Begin
			
 
				+        Dec(expDiff);
			
 
				+      End
			
 
				+    else
			
 
				+      Begin
			
 
				+        bSig := bSig OR $40000000;
			
 
				+      End;
			
 
				+    shift32RightJamming( bSig, expDiff, bSig );
			
 
				+    aSig := aSig OR $40000000;
			
 
				+ aBigger:
			
 
				+    zSig := aSig - bSig;
			
 
				+    zExp := aExp;
			
 
				+ normalizeRoundAndPack:
			
 
				+    Dec(zExp);
			
 
				+    subFloat32Sigs := normalizeRoundAndPackFloat32( zSign, zExp, zSig );
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of adding the single-precision floating-point values `a'
			
 
				+and `b'.  The operation is performed according to the IEC/IEEE Standard for
			
 
				+Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_add( a: float32; b:float32 ): float32;
			
 
				+  Var
			
 
				+    aSign, bSign: Flag;
			
 
				+  Begin
			
 
				+    aSign := extractFloat32Sign( a );
			
 
				+    bSign := extractFloat32Sign( b );
			
 
				+    if ( aSign = bSign ) then
			
 
				+      Begin
			
 
				+        float32_add := addFloat32Sigs( a, b, aSign );
			
 
				+      End
			
 
				+    else
			
 
				+      Begin
			
 
				+        float32_add := subFloat32Sigs( a, b, aSign );
			
 
				+      End;
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of subtracting the single-precision floating-point values
			
 
				+`a' and `b'.  The operation is performed according to the IEC/IEEE Standard
			
 
				+for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_sub( a: float32 ; b:float32 ): float32;
			
 
				+  Var
			
 
				+    aSign, bSign: flag;
			
 
				+  Begin
			
 
				+    aSign := extractFloat32Sign( a );
			
 
				+    bSign := extractFloat32Sign( b );
			
 
				+    if ( aSign = bSign ) then
			
 
				+      Begin
			
 
				+        float32_sub := subFloat32Sigs( a, b, aSign );
			
 
				+      End
			
 
				+    else
			
 
				+      Begin
			
 
				+        float32_sub := addFloat32Sigs( a, b, aSign );
			
 
				+      End;
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of multiplying the single-precision floating-point values
			
 
				+`a' and `b'.  The operation is performed according to the IEC/IEEE Standard
			
 
				+for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_mul(a: float32; b: float32 ) : float32;
			
 
				+
			
 
				+  Var
			
 
				+    aSign, bSign, zSign: flag;
			
 
				+    aExp, bExp, zExp : int16;
			
 
				+    aSig, bSig, zSig0, zSig1: bits32;
			
 
				+  Begin
			
 
				+    aSig := extractFloat32Frac( a );
			
 
				+    aExp := extractFloat32Exp( a );
			
 
				+    aSign := extractFloat32Sign( a );
			
 
				+    bSig := extractFloat32Frac( b );
			
 
				+    bExp := extractFloat32Exp( b );
			
 
				+    bSign := extractFloat32Sign( b );
			
 
				+    zSign := aSign xor bSign;
			
 
				+    if ( aExp = $FF ) then
			
 
				+    Begin
			
 
				+        if ( (aSig<>0) OR ( ( bExp = $FF ) AND  (bSig<>0) ) ) then
			
 
				+        Begin
			
 
				+            float32_mul := propagateFloat32NaN( a, b );
			
 
				+        End;
			
 
				+        if ( ( bExp OR  bSig ) = 0 ) then
			
 
				+        Begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            float32_mul := float32_default_nan;
			
 
				+            exit;
			
 
				+        End;
			
 
				+        float32_mul := packFloat32( zSign, $FF, 0 );
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( bExp = $FF ) then
			
 
				+    Begin
			
 
				+        if ( bSig <> 0 ) then
			
 
				+        Begin
			
 
				+           float32_mul := propagateFloat32NaN( a, b );
			
 
				+           exit;
			
 
				+        End;
			
 
				+        if ( ( aExp OR  aSig ) = 0 ) then
			
 
				+        Begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            float32_mul := float32_default_nan;
			
 
				+            exit;
			
 
				+        End;
			
 
				+        float32_mul := packFloat32( zSign, $FF, 0 );
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( aExp = 0 ) then
			
 
				+    Begin
			
 
				+        if ( aSig = 0 ) then
			
 
				+        Begin
			
 
				+           float32_mul := packFloat32( zSign, 0, 0 );
			
 
				+           exit;
			
 
				+        End;
			
 
				+        normalizeFloat32Subnormal( aSig, aExp, aSig );
			
 
				+    End;
			
 
				+    if ( bExp = 0 ) then
			
 
				+    Begin
			
 
				+        if ( bSig = 0 ) then
			
 
				+         Begin
			
 
				+           float32_mul := packFloat32( zSign, 0, 0 );
			
 
				+           exit;
			
 
				+         End;
			
 
				+        normalizeFloat32Subnormal( bSig, bExp, bSig );
			
 
				+    End;
			
 
				+    zExp := aExp + bExp - $7F;
			
 
				+    aSig := ( aSig OR  $00800000 ) shl 7;
			
 
				+    bSig := ( bSig OR  $00800000 ) shl 8;
			
 
				+    mul32To64( aSig, bSig, zSig0, zSig1 );
			
 
				+    zSig0 := zSig0 OR bits32( zSig1 <> 0 );
			
 
				+    if ( 0 <= sbits32 ( zSig0 shl 1 ) ) then
			
 
				+    Begin
			
 
				+        zSig0 := zSig0 shl 1;
			
 
				+        Dec(zExp);
			
 
				+    End;
			
 
				+    float32_mul := roundAndPackFloat32( zSign, zExp, zSig0 );
			
 
				+ End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of dividing the single-precision floating-point value `a'
			
 
				+by the corresponding value `b'.  The operation is performed according to the
			
 
				+IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_div(a: float32;b: float32 ): float32;
			
 
				+  Var
			
 
				+    aSign, bSign, zSign: flag;
			
 
				+    aExp, bExp, zExp: int16;
			
 
				+    aSig, bSig, zSig, rem0, rem1, term0, term1: bits32;
			
 
				+  Begin
			
 
				+    aSig := extractFloat32Frac( a );
			
 
				+    aExp := extractFloat32Exp( a );
			
 
				+    aSign := extractFloat32Sign( a );
			
 
				+    bSig := extractFloat32Frac( b );
			
 
				+    bExp := extractFloat32Exp( b );
			
 
				+    bSign := extractFloat32Sign( b );
			
 
				+    zSign := aSign xor bSign;
			
 
				+    if ( aExp = $FF ) then
			
 
				+      Begin
			
 
				+        if ( aSig <> 0 ) then
			
 
				+        Begin
			
 
				+           float32_div := propagateFloat32NaN( a, b );
			
 
				+           exit;
			
 
				+        End;
			
 
				+        if ( bExp = $FF ) then
			
 
				+        Begin
			
 
				+            if ( bSig <> 0) then
			
 
				+            Begin
			
 
				+              float32_div := propagateFloat32NaN( a, b );
			
 
				+            End;
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            float32_div := float32_default_nan;
			
 
				+            exit;
			
 
				+        End;
			
 
				+        float32_div := packFloat32( zSign, $FF, 0 );
			
 
				+        exit;
			
 
				+      End;
			
 
				+    if ( bExp = $FF ) then
			
 
				+    Begin
			
 
				+        if ( bSig <> 0) then
			
 
				+        Begin
			
 
				+          float32_div := propagateFloat32NaN( a, b );
			
 
				+          exit;
			
 
				+        End;
			
 
				+        float32_div := packFloat32( zSign, 0, 0 );
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( bExp = 0 ) Then
			
 
				+    Begin
			
 
				+        if ( bSig = 0 ) Then
			
 
				+        Begin
			
 
				+            if ( ( aExp OR  aSig ) = 0 ) then
			
 
				+            Begin
			
 
				+                float_raise( float_flag_invalid );
			
 
				+                float32_div := float32_default_nan;
			
 
				+                exit;
			
 
				+            End;
			
 
				+            float_raise( float_flag_divbyzero );
			
 
				+            float32_div := packFloat32( zSign, $FF, 0 );
			
 
				+            exit;
			
 
				+        End;
			
 
				+        normalizeFloat32Subnormal( bSig, bExp, bSig );
			
 
				+    End;
			
 
				+    if ( aExp = 0 ) Then
			
 
				+    Begin
			
 
				+        if ( aSig = 0 ) Then
			
 
				+        Begin
			
 
				+          float32_div := packFloat32( zSign, 0, 0 );
			
 
				+          exit;
			
 
				+        End;
			
 
				+        normalizeFloat32Subnormal( aSig, aExp, aSig );
			
 
				+    End;
			
 
				+    zExp := aExp - bExp + $7D;
			
 
				+    aSig := ( aSig OR  $00800000 ) shl 7;
			
 
				+    bSig := ( bSig OR  $00800000 ) shl 8;
			
 
				+    if ( bSig <= ( aSig + aSig ) ) then
			
 
				+    Begin
			
 
				+        aSig := aSig shr 1;
			
 
				+        Inc(zExp);
			
 
				+    End;
			
 
				+    zSig := estimateDiv64To32( aSig, 0, bSig );
			
 
				+    if ( ( zSig and $3F ) <= 2 ) then
			
 
				+    Begin
			
 
				+        mul32To64( bSig, zSig, term0, term1 );
			
 
				+        sub64( aSig, 0, term0, term1, rem0, rem1 );
			
 
				+        while ( sbits32 (rem0) < 0 ) do
			
 
				+        Begin
			
 
				+            Dec(zSig);
			
 
				+            add64( rem0, rem1, 0, bSig, rem0, rem1 );
			
 
				+        End;
			
 
				+        zSig := zSig or bits32( rem1 <> 0 );
			
 
				+    End;
			
 
				+    float32_div := roundAndPackFloat32( zSign, zExp, zSig );
			
 
				+
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the remainder of the single-precision floating-point value `a'
			
 
				+with respect to the corresponding value `b'.  The operation is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_rem(a: float32; b: float32 ):float32;
			
 
				+  Var
			
 
				+    aSign, bSign, zSign: flag;
			
 
				+    aExp, bExp, expDiff: int16;
			
 
				+    aSig, bSig, q, allZero, alternateASig: bits32;
			
 
				+    sigMean: sbits32;
			
 
				+  Begin
			
 
				+    aSig := extractFloat32Frac( a );
			
 
				+    aExp := extractFloat32Exp( a );
			
 
				+    aSign := extractFloat32Sign( a );
			
 
				+    bSig := extractFloat32Frac( b );
			
 
				+    bExp := extractFloat32Exp( b );
			
 
				+    bSign := extractFloat32Sign( b );
			
 
				+    if ( aExp = $FF ) then
			
 
				+    Begin
			
 
				+        if ( (aSig<>0) OR ( ( bExp = $FF ) AND  (bSig <>0)) ) then
			
 
				+        Begin
			
 
				+            float32_rem := propagateFloat32NaN( a, b );
			
 
				+            exit;
			
 
				+        End;
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        float32_rem := float32_default_nan;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( bExp = $FF ) then
			
 
				+    Begin
			
 
				+        if ( bSig <> 0 ) then
			
 
				+        Begin
			
 
				+          float32_rem := propagateFloat32NaN( a, b );
			
 
				+          exit;
			
 
				+        End;
			
 
				+        float32_rem := a;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( bExp = 0 ) then
			
 
				+    Begin
			
 
				+        if ( bSig = 0 ) then
			
 
				+        Begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            float32_rem := float32_default_nan;
			
 
				+            exit;
			
 
				+        End;
			
 
				+        normalizeFloat32Subnormal( bSig, bExp, bSig );
			
 
				+    End;
			
 
				+    if ( aExp = 0 ) then
			
 
				+    Begin
			
 
				+        if ( aSig = 0 ) then
			
 
				+        Begin
			
 
				+           float32_rem := a;
			
 
				+           exit;
			
 
				+        End;
			
 
				+        normalizeFloat32Subnormal( aSig, aExp, aSig );
			
 
				+    End;
			
 
				+    expDiff := aExp - bExp;
			
 
				+    aSig := ( aSig OR  $00800000 ) shl 8;
			
 
				+    bSig := ( bSig OR  $00800000 ) shl 8;
			
 
				+    if ( expDiff < 0 ) then
			
 
				+    Begin
			
 
				+        if ( expDiff < -1 ) then
			
 
				+        Begin
			
 
				+           float32_rem := a;
			
 
				+           exit;
			
 
				+        End;
			
 
				+        aSig := aSig shr 1;
			
 
				+    End;
			
 
				+    q := bits32( bSig <= aSig );
			
 
				+    if ( q <> 0) then
			
 
				+       aSig := aSig - bSig;
			
 
				+    expDiff := expDiff - 32;
			
 
				+    while ( 0 < expDiff ) do
			
 
				+    Begin
			
 
				+        q := estimateDiv64To32( aSig, 0, bSig );
			
 
				+        if (2 < q) then
			
 
				+         q := q - 2
			
 
				+        else
			
 
				+         q := 0;
			
 
				+        aSig := - ( ( bSig shr 2 ) * q );
			
 
				+        expDiff := expDiff - 30;
			
 
				+    End;
			
 
				+    expDiff := expDiff + 32;
			
 
				+    if ( 0 < expDiff ) then
			
 
				+    Begin
			
 
				+        q := estimateDiv64To32( aSig, 0, bSig );
			
 
				+        if (2 < q) then
			
 
				+         q := q - 2
			
 
				+        else
			
 
				+         q := 0;
			
 
				+        q := q shr (32 - expDiff);
			
 
				+        bSig := bSig shr 2;
			
 
				+        aSig := ( ( aSig shr 1 ) shl ( expDiff - 1 ) ) - bSig * q;
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        aSig := aSig shr 2;
			
 
				+        bSig := bSig shr 2;
			
 
				+    End;
			
 
				+    Repeat
			
 
				+        alternateASig := aSig;
			
 
				+        Inc(q);
			
 
				+        aSig := aSig - bSig;
			
 
				+    Until not ( 0 <= sbits32 (aSig) );
			
 
				+    sigMean := aSig + alternateASig;
			
 
				+    if ( ( sigMean < 0 ) OR ( ( sigMean = 0 ) AND  (( q and 1 )<>0) ) ) then
			
 
				+    Begin
			
 
				+        aSig := alternateASig;
			
 
				+    End;
			
 
				+    zSign := flag( sbits32 (aSig) < 0 );
			
 
				+    if ( zSign<>0 ) then
			
 
				+      aSig := - aSig;
			
 
				+    float32_rem := normalizeRoundAndPackFloat32( aSign xor zSign, bExp, aSig );
			
 
				+  End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the square root of the single-precision floating-point value `a'.
			
 
				+The operation is performed according to the IEC/IEEE Standard for Binary
			
 
				+Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_sqrt(a: float32 ): float32;
			
 
				+Var
			
 
				+    aSign : flag;
			
 
				+    aExp, zExp : int16;
			
 
				+    aSig, zSig, rem0, rem1, term0, term1: bits32;
			
 
				+    label roundAndPack;
			
 
				+Begin
			
 
				+    aSig := extractFloat32Frac( a );
			
 
				+    aExp := extractFloat32Exp( a );
			
 
				+    aSign := extractFloat32Sign( a );
			
 
				+    if ( aExp = $FF ) then
			
 
				+    Begin
			
 
				+        if ( aSig <> 0) then
			
 
				+        Begin
			
 
				+           float32_sqrt := propagateFloat32NaN( a, 0 );
			
 
				+           exit;
			
 
				+        End;
			
 
				+        if ( aSign = 0) then
			
 
				+        Begin
			
 
				+          float32_sqrt := a;
			
 
				+          exit;
			
 
				+        End;
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        float32_sqrt := float32_default_nan;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( aSign <> 0) then
			
 
				+    Begin
			
 
				+        if ( ( aExp OR  aSig ) = 0 ) then
			
 
				+        Begin
			
 
				+           float32_sqrt := a;
			
 
				+           exit;
			
 
				+        End;
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        float32_sqrt := float32_default_nan;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( aExp = 0 ) then
			
 
				+    Begin
			
 
				+        if ( aSig = 0 ) then
			
 
				+        Begin
			
 
				+           float32_sqrt := 0;
			
 
				+           exit;
			
 
				+        End;
			
 
				+        normalizeFloat32Subnormal( aSig, aExp, aSig );
			
 
				+    End;
			
 
				+    zExp := ( ( aExp - $7F ) shr 1 ) + $7E;
			
 
				+    aSig := ( aSig OR  $00800000 ) shl 8;
			
 
				+    zSig := estimateSqrt32( aExp, aSig ) + 2;
			
 
				+    if ( ( zSig and $7F ) <= 5 ) then
			
 
				+    Begin
			
 
				+        if ( zSig < 2 ) then
			
 
				+        Begin
			
 
				+            zSig := $7FFFFFFF;
			
 
				+            goto roundAndPack;
			
 
				+        End
			
 
				+        else
			
 
				+        Begin
			
 
				+            aSig  := aSig shr (aExp and 1);
			
 
				+            mul32To64( zSig, zSig, term0, term1 );
			
 
				+            sub64( aSig, 0, term0, term1, rem0, rem1 );
			
 
				+            while ( sbits32 (rem0) < 0 ) do
			
 
				+            Begin
			
 
				+                Dec(zSig);
			
 
				+                shortShift64Left( 0, zSig, 1, term0, term1 );
			
 
				+                term1 := term1 or 1;
			
 
				+                add64( rem0, rem1, term0, term1, rem0, rem1 );
			
 
				+            End;
			
 
				+            zSig := zSig OR bits32( ( rem0 OR  rem1 ) <> 0 );
			
 
				+        End;
			
 
				+    End;
			
 
				+    shift32RightJamming( zSig, 1, zSig );
			
 
				+ roundAndPack:
			
 
				+    float32_sqrt := roundAndPackFloat32( 0, zExp, zSig );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the single-precision floating-point value `a' is equal to
			
 
				+the corresponding value `b', and 0 otherwise.  The comparison is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_eq( a:float32; b:float32): flag;
			
 
				+Begin
			
 
				+    if ((( extractFloat32Exp( a ) = $FF ) AND  (extractFloat32Frac( a )<>0))
			
 
				+         OR ( ( extractFloat32Exp( b ) = $FF ) AND  (extractFloat32Frac( b )<>0) )
			
 
				+       ) then
			
 
				+    Begin
			
 
				+        if ( (float32_is_signaling_nan( a )<>0) OR (float32_is_signaling_nan( b )<>0) ) then
			
 
				+        Begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+        End;
			
 
				+        float32_eq := 0;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    float32_eq := flag( a = b ) OR flag( bits32 ( ( a OR  b ) shl 1 ) = 0 );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the single-precision floating-point value `a' is less than
			
 
				+or equal to the corresponding value `b', and 0 otherwise.  The comparison
			
 
				+is performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_le( a: float32; b : float32 ):flag;
			
 
				+var
			
 
				+    aSign, bSign: flag;
			
 
				+Begin
			
 
				+
			
 
				+    if (    ( ( extractFloat32Exp( a ) = $FF ) AND  (extractFloat32Frac( a )<>0) )
			
 
				+         OR ( ( extractFloat32Exp( b ) = $FF ) AND  (extractFloat32Frac( b )<>0) )
			
 
				+       ) then
			
 
				+    Begin
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        float32_le := 0;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    aSign := extractFloat32Sign( a );
			
 
				+    bSign := extractFloat32Sign( b );
			
 
				+    if ( aSign <> bSign ) then
			
 
				+    Begin
			
 
				+       float32_le :=  aSign OR flag( bits32 ( ( a OR  b ) shl 1 ) = 0 );
			
 
				+       exit;
			
 
				+    End;
			
 
				+    float32_le := flag(flag( a = b ) OR flag( aSign xor flag( a < b ) ));
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the single-precision floating-point value `a' is less than
			
 
				+the corresponding value `b', and 0 otherwise.  The comparison is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_lt( a:float32 ; b : float32): flag;
			
 
				+var
			
 
				+    aSign, bSign: flag;
			
 
				+Begin
			
 
				+
			
 
				+    if (    ( ( extractFloat32Exp( a ) = $FF ) AND  (extractFloat32Frac( a ) <>0))
			
 
				+         OR ( ( extractFloat32Exp( b ) = $FF ) AND  (extractFloat32Frac( b ) <>0) )
			
 
				+       ) then
			
 
				+    Begin
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        float32_lt :=0;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    aSign := extractFloat32Sign( a );
			
 
				+    bSign := extractFloat32Sign( b );
			
 
				+    if ( aSign <> bSign ) then
			
 
				+    Begin
			
 
				+       float32_lt := aSign AND  flag( bits32 ( ( a OR  b ) shl 1 ) <> 0 );
			
 
				+       exit;
			
 
				+    End;
			
 
				+    float32_lt := flag(flag( a <> b ) AND  flag( aSign xor flag( a < b ) ));
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the single-precision floating-point value `a' is equal to
			
 
				+the corresponding value `b', and 0 otherwise.  The invalid exception is
			
 
				+raised if either operand is a NaN.  Otherwise, the comparison is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_eq_signaling( a: float32; b: float32) : flag;
			
 
				+Begin
			
 
				+
			
 
				+    if (    ( ( extractFloat32Exp( a ) = $FF ) AND  (extractFloat32Frac( a ) <> 0))
			
 
				+         OR ( ( extractFloat32Exp( b ) = $FF ) AND  (extractFloat32Frac( b ) <> 0))
			
 
				+       ) then
			
 
				+    Begin
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        float32_eq_signaling := 0;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    float32_eq_signaling := (flag( a = b ) OR flag( bits32 ( ( a OR  b ) shl 1 ) = 0 ));
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the single-precision floating-point value `a' is less than or
			
 
				+equal to the corresponding value `b', and 0 otherwise.  Quiet NaNs do not
			
 
				+cause an exception.  Otherwise, the comparison is performed according to the
			
 
				+IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_le_quiet( a: float32 ; b : float32 ): flag;
			
 
				+Var
			
 
				+    aSign, bSign: flag;
			
 
				+    aExp, bExp: int16;
			
 
				+Begin
			
 
				+    if (    ( ( extractFloat32Exp( a ) = $FF ) AND  (extractFloat32Frac( a )<>0) )
			
 
				+         OR ( ( extractFloat32Exp( b ) = $FF ) AND  (extractFloat32Frac( b )<>0) )
			
 
				+       ) then
			
 
				+    Begin
			
 
				+        if ( (float32_is_signaling_nan( a )<>0) OR (float32_is_signaling_nan( b )<>0) ) then
			
 
				+        Begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+        End;
			
 
				+        float32_le_quiet := 0;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    aSign := extractFloat32Sign( a );
			
 
				+    bSign := extractFloat32Sign( b );
			
 
				+    if ( aSign <> bSign ) then
			
 
				+    Begin
			
 
				+       float32_le_quiet := aSign OR flag( bits32 ( ( a OR  b ) shl 1 ) = 0 );
			
 
				+       exit;
			
 
				+    End;
			
 
				+    float32_le_quiet := flag(flag( a = b ) OR flag( aSign xor flag( a < b ) ));
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the single-precision floating-point value `a' is less than
			
 
				+the corresponding value `b', and 0 otherwise.  Quiet NaNs do not cause an
			
 
				+exception.  Otherwise, the comparison is performed according to the IEC/IEEE
			
 
				+Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float32_lt_quiet( a: float32 ; b: float32 ): flag;
			
 
				+Var
			
 
				+   aSign, bSign: flag;
			
 
				+Begin
			
 
				+    if (    ( ( extractFloat32Exp( a ) = $FF ) AND  (extractFloat32Frac( a )<>0) )
			
 
				+         OR ( ( extractFloat32Exp( b ) = $FF ) AND  (extractFloat32Frac( b )<>0) )
			
 
				+       ) then
			
 
				+    Begin
			
 
				+        if ( (float32_is_signaling_nan( a )<>0) OR (float32_is_signaling_nan( b )<>0) ) then
			
 
				+        Begin
			
 
				+            float_raise( float_flag_invalid );
			
 
				+        End;
			
 
				+        float32_lt_quiet := 0;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    aSign := extractFloat32Sign( a );
			
 
				+    bSign := extractFloat32Sign( b );
			
 
				+    if ( aSign <> bSign ) then
			
 
				+    Begin
			
 
				+        float32_lt_quiet := aSign AND  flag( bits32 ( ( a OR  b ) shl 1 ) <> 0 );
			
 
				+        exit;
			
 
				+    End;
			
 
				+    float32_lt_quiet := flag(flag( a <> b ) AND  ( aSign xor flag( a < b ) ));
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the double-precision floating-point value
			
 
				+`a' to the 32-bit two's complement integer format.  The conversion is
			
 
				+performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic---which means in particular that the conversion is rounded
			
 
				+according to the current rounding mode.  If `a' is a NaN, the largest
			
 
				+positive integer is returned.  Otherwise, if the conversion overflows, the
			
 
				+largest integer with the same sign as `a' is returned.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_to_int32(a: float64): int32;
			
 
				+var
			
 
				+    aSign: flag;
			
 
				+    aExp, shiftCount: int16;
			
 
				+    aSig0, aSig1, absZ, aSigExtra: bits32;
			
 
				+    z: int32;
			
 
				+    roundingMode: int8;
			
 
				+    label invalid;
			
 
				+Begin
			
 
				+    aSig1 := extractFloat64Frac1( a );
			
 
				+    aSig0 := extractFloat64Frac0( a );
			
 
				+    aExp := extractFloat64Exp( a );
			
 
				+    aSign := extractFloat64Sign( a );
			
 
				+    shiftCount := aExp - $413;
			
 
				+    if ( 0 <= shiftCount ) then
			
 
				+    Begin
			
 
				+        if ( $41E < aExp ) then
			
 
				+        Begin
			
 
				+            if ( ( aExp = $7FF ) AND  (( aSig0 OR  aSig1 )<>0) ) then
			
 
				+               aSign := 0;
			
 
				+            goto invalid;
			
 
				+        End;
			
 
				+        shortShift64Left(
			
 
				+            aSig0 OR  $00100000, aSig1, shiftCount, absZ, aSigExtra );
			
 
				+        if ( $80000000 < absZ ) then
			
 
				+          goto invalid;
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        aSig1 := flag( aSig1 <> 0 );
			
 
				+        if ( aExp < $3FE ) then
			
 
				+        Begin
			
 
				+            aSigExtra := aExp OR  aSig0 OR  aSig1;
			
 
				+            absZ := 0;
			
 
				+        End
			
 
				+        else
			
 
				+        Begin
			
 
				+            aSig0 := aSig0 OR $00100000;
			
 
				+            aSigExtra := ( aSig0 shl ( shiftCount and 31 ) ) OR  aSig1;
			
 
				+            absZ := aSig0 shr ( - shiftCount );
			
 
				+        End;
			
 
				+    End;
			
 
				+    roundingMode := float_rounding_mode;
			
 
				+    if ( roundingMode = float_round_nearest_even ) then
			
 
				+    Begin
			
 
				+        if ( sbits32(aSigExtra) < 0 ) then
			
 
				+        Begin
			
 
				+            Inc(absZ);
			
 
				+            if ( bits32 ( aSigExtra shl 1 ) = 0 ) then
			
 
				+               absZ :=  absZ and not 1;
			
 
				+        End;
			
 
				+        if aSign <> 0 then
			
 
				+          z := - absZ
			
 
				+        else
			
 
				+          z := absZ;
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        aSigExtra := bits32( aSigExtra <> 0 );
			
 
				+        if ( aSign <> 0) then
			
 
				+        Begin
			
 
				+            z := - (   absZ
			
 
				+                    + ( int32( roundingMode = float_round_down ) and aSigExtra ) );
			
 
				+        End
			
 
				+        else
			
 
				+        Begin
			
 
				+            z := absZ + ( int32( roundingMode = float_round_up ) and aSigExtra );
			
 
				+        End
			
 
				+    End;
			
 
				+    if ( (( aSign xor flag( z < 0 ) )<>0) AND  (z<>0) ) then
			
 
				+    Begin
			
 
				+ invalid:
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        if (aSign <> 0 ) then
			
 
				+          float64_to_int32 := sbits32 ($80000000)
			
 
				+        else
			
 
				+          float64_to_int32 :=  $7FFFFFFF;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( aSigExtra <> 0) then
			
 
				+       float_exception_flags := float_exception_flags or float_flag_inexact;
			
 
				+    float64_to_int32 := z;
			
 
				+End;
			
 
				+
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the double-precision floating-point value
			
 
				+`a' to the 32-bit two's complement integer format.  The conversion is
			
 
				+performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic, except that the conversion is always rounded toward zero.
			
 
				+If `a' is a NaN, the largest positive integer is returned.  Otherwise, if
			
 
				+the conversion overflows, the largest integer with the same sign as `a' is
			
 
				+returned.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_to_int32_round_to_zero(a: float64 ): int32;
			
 
				+Var
			
 
				+    aSign: flag;
			
 
				+    aExp, shiftCount: int16;
			
 
				+    aSig0, aSig1, absZ, aSigExtra: bits32;
			
 
				+    z: int32;
			
 
				+    label invalid;
			
 
				+ Begin
			
 
				+    aSig1 := extractFloat64Frac1( a );
			
 
				+    aSig0 := extractFloat64Frac0( a );
			
 
				+    aExp := extractFloat64Exp( a );
			
 
				+    aSign := extractFloat64Sign( a );
			
 
				+    shiftCount := aExp - $413;
			
 
				+    if ( 0 <= shiftCount ) then
			
 
				+    Begin
			
 
				+        if ( $41E < aExp ) then
			
 
				+        Begin
			
 
				+            if ( ( aExp = $7FF ) AND  (( aSig0 OR  aSig1 )<>0) ) then
			
 
				+               aSign := 0;
			
 
				+            goto invalid;
			
 
				+        End;
			
 
				+        shortShift64Left(
			
 
				+            aSig0 OR  $00100000, aSig1, shiftCount, absZ, aSigExtra );
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        if ( aExp < $3FF ) then
			
 
				+        Begin
			
 
				+            if ( aExp OR  aSig0 OR  aSig1 )<>0 then
			
 
				+            Begin
			
 
				+                float_exception_flags :=
			
 
				+                  float_exception_flags or float_flag_inexact;
			
 
				+            End;
			
 
				+            float64_to_int32_round_to_zero := 0;
			
 
				+            exit;
			
 
				+        End;
			
 
				+        aSig0 := aSig0 or $00100000;
			
 
				+        aSigExtra := ( aSig0 shl ( shiftCount and 31 ) ) OR  aSig1;
			
 
				+        absZ := aSig0 shr ( - shiftCount );
			
 
				+    End;
			
 
				+    if aSign <> 0 then
			
 
				+      z := - absZ
			
 
				+    else
			
 
				+      z := absZ;
			
 
				+    if ( (( aSign xor flag( z < 0 )) <> 0) AND  (z<>0) ) then
			
 
				+    Begin
			
 
				+ invalid:
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        if (aSign <> 0) then
			
 
				+          float64_to_int32_round_to_zero := sbits32 ($80000000)
			
 
				+        else
			
 
				+          float64_to_int32_round_to_zero :=  $7FFFFFFF;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( aSigExtra <> 0) then
			
 
				+       float_exception_flags := float_exception_flags or float_flag_inexact;
			
 
				+    float64_to_int32_round_to_zero := z;
			
 
				+ End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of converting the double-precision floating-point value
			
 
				+`a' to the single-precision floating-point format.  The conversion is
			
 
				+performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_to_float32(a: float64 ): float32;
			
 
				+Var
			
 
				+    aSign: flag;
			
 
				+    aExp: int16;
			
 
				+    aSig0, aSig1, zSig: bits32;
			
 
				+    allZero: bits32;
			
 
				+    tmp : CommonNanT;
			
 
				+Begin
			
 
				+    aSig1 := extractFloat64Frac1( a );
			
 
				+    aSig0 := extractFloat64Frac0( a );
			
 
				+    aExp := extractFloat64Exp( a );
			
 
				+    aSign := extractFloat64Sign( a );
			
 
				+    if ( aExp = $7FF ) then
			
 
				+    Begin
			
 
				+        if ( aSig0 OR  aSig1 ) <> 0 then
			
 
				+        Begin
			
 
				+            float64ToCommonNaN( a, tmp );
			
 
				+            float64_to_float32 := commonNaNToFloat32( tmp );
			
 
				+            exit;
			
 
				+        End;
			
 
				+        float64_to_float32 := packFloat32( aSign, $FF, 0 );
			
 
				+        exit;
			
 
				+    End;
			
 
				+    shift64RightJamming( aSig0, aSig1, 22, allZero, zSig );
			
 
				+    if ( aExp <> 0) then
			
 
				+      zSig := zSig OR $40000000;
			
 
				+    float64_to_float32 := roundAndPackFloat32( aSign, aExp - $381, zSig );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Rounds the double-precision floating-point value `a' to an integer,
			
 
				+and returns the result as a double-precision floating-point value.  The
			
 
				+operation is performed according to the IEC/IEEE Standard for Binary
			
 
				+Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_round_to_int(a: float64; var out: float64 );
			
 
				+Var
			
 
				+    aSign: flag;
			
 
				+    aExp: int16;
			
 
				+    lastBitMask, roundBitsMask: bits32;
			
 
				+    roundingMode: int8;
			
 
				+    z: float64;
			
 
				+Begin
			
 
				+    aExp := extractFloat64Exp( a );
			
 
				+    if ( $413 <= aExp ) then
			
 
				+    Begin
			
 
				+        if ( $433 <= aExp ) then
			
 
				+        Begin
			
 
				+            if (    ( aExp = $7FF )
			
 
				+                 AND
			
 
				+            (
			
 
				+            ( extractFloat64Frac0( a ) OR  extractFloat64Frac1( a )
			
 
				+            ) <>0)
			
 
				+            )  then
			
 
				+            Begin
			
 
				+                propagateFloat64NaN( a, a, out );
			
 
				+                exit;
			
 
				+            End;
			
 
				+            out := a;
			
 
				+            exit;
			
 
				+        End;
			
 
				+        lastBitMask := 1;
			
 
				+        lastBitMask := ( lastBitMask shl ( $432 - aExp ) ) shl 1;
			
 
				+        roundBitsMask := lastBitMask - 1;
			
 
				+        z := a;
			
 
				+        roundingMode := float_rounding_mode;
			
 
				+        if ( roundingMode = float_round_nearest_even ) then
			
 
				+        Begin
			
 
				+            if ( lastBitMask <> 0) then
			
 
				+            Begin
			
 
				+                add64( z.high, z.low, 0, lastBitMask shr 1, z.high, z.low );
			
 
				+                if ( ( z.low and roundBitsMask ) = 0 ) then
			
 
				+                   z.low := z.low and not lastBitMask;
			
 
				+            End
			
 
				+            else
			
 
				+            Begin
			
 
				+                if ( sbits32 (z.low) < 0 ) then
			
 
				+                Begin
			
 
				+                    Inc(z.high);
			
 
				+                    if ( bits32 ( z.low shl 1 ) = 0 ) then
			
 
				+                      z.high := z.high and not 1;
			
 
				+                End;
			
 
				+            End;
			
 
				+        End
			
 
				+        else if ( roundingMode <> float_round_to_zero ) then
			
 
				+        Begin
			
 
				+            if (   extractFloat64Sign( z )
			
 
				+                 xor flag( roundingMode = float_round_up ) )<> 0 then
			
 
				+            Begin
			
 
				+                add64( z.high, z.low, 0, roundBitsMask, z.high, z.low );
			
 
				+            End;
			
 
				+        End;
			
 
				+        z.low := z.low and not roundBitsMask;
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        if ( aExp <= $3FE ) then
			
 
				+        Begin
			
 
				+            if ( ( ( bits32 ( a.high shl 1 ) ) OR  a.low ) = 0 ) then
			
 
				+            Begin
			
 
				+                out := a;
			
 
				+                exit;
			
 
				+            End;
			
 
				+            float_exception_flags := float_exception_flags or
			
 
				+               float_flag_inexact;
			
 
				+            aSign := extractFloat64Sign( a );
			
 
				+            case ( float_rounding_mode ) of
			
 
				+             float_round_nearest_even:
			
 
				+               Begin
			
 
				+                if (    ( aExp = $3FE )
			
 
				+                     AND  ( (extractFloat64Frac0( a ) OR  extractFloat64Frac1( a ) )<>0)
			
 
				+                   ) then
			
 
				+                Begin
			
 
				+                    packFloat64( aSign, $3FF, 0, 0, out );
			
 
				+                    exit;
			
 
				+                End;
			
 
				+
			
 
				+               End;
			
 
				+               float_round_down:
			
 
				+                Begin
			
 
				+                  if aSign<>0 then
			
 
				+                   packFloat64( 1, $3FF, 0, 0, out )
			
 
				+                  else
			
 
				+                   packFloat64( 0, 0, 0, 0, out );
			
 
				+                  exit;
			
 
				+                End;
			
 
				+             float_round_up:
			
 
				+                Begin
			
 
				+                  if aSign <> 0 then
			
 
				+                   packFloat64( 1, 0, 0, 0, out )
			
 
				+                  else
			
 
				+                   packFloat64( 0, $3FF, 0, 0, out );
			
 
				+                  exit;
			
 
				+                End;
			
 
				+            end;
			
 
				+            packFloat64( aSign, 0, 0, 0, out );
			
 
				+            exit;
			
 
				+        End;
			
 
				+        lastBitMask := 1;
			
 
				+        lastBitMask := lastBitMask shl ($413 - aExp);
			
 
				+        roundBitsMask := lastBitMask - 1;
			
 
				+        z.low := 0;
			
 
				+        z.high := a.high;
			
 
				+        roundingMode := float_rounding_mode;
			
 
				+        if ( roundingMode = float_round_nearest_even ) then
			
 
				+        Begin
			
 
				+            z.high := z.high + lastBitMask shr 1;
			
 
				+            if ( ( ( z.high and roundBitsMask ) OR  a.low ) = 0 ) then
			
 
				+            Begin
			
 
				+                z.high := z.high and not lastBitMask;
			
 
				+            End;
			
 
				+        End
			
 
				+        else if ( roundingMode <> float_round_to_zero ) then
			
 
				+        Begin
			
 
				+            if (   extractFloat64Sign( z )
			
 
				+                 xor flag( roundingMode = float_round_up ) )<> 0 then
			
 
				+            Begin
			
 
				+                z.high := z.high or bits32( a.low <> 0 );
			
 
				+                z.high := z.high + roundBitsMask;
			
 
				+            End;
			
 
				+        End;
			
 
				+        z.high := z.high and not roundBitsMask;
			
 
				+    End;
			
 
				+    if ( ( z.low <> a.low ) OR ( z.high <> a.high ) ) then
			
 
				+    Begin
			
 
				+        float_exception_flags :=
			
 
				+          float_exception_flags or float_flag_inexact;
			
 
				+    End;
			
 
				+    out := z;
			
 
				+End;
			
 
				+
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of adding the absolute values of the double-precision
			
 
				+floating-point values `a' and `b'.  If `zSign' is 1, the sum is negated
			
 
				+before being returned.  `zSign' is ignored if the result is a NaN.
			
 
				+The addition is performed according to the IEC/IEEE Standard for Binary
			
 
				+Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure addFloat64Sigs( a:float64 ; b: float64 ; zSign:flag; Var out: float64 );
			
 
				+Var
			
 
				+    aExp, bExp, zExp: int16;
			
 
				+    aSig0, aSig1, bSig0, bSig1, zSig0, zSig1, zSig2: bits32;
			
 
				+    expDiff: int16;
			
 
				+    label shiftRight1;
			
 
				+    label roundAndPack;
			
 
				+Begin
			
 
				+    aSig1 := extractFloat64Frac1( a );
			
 
				+    aSig0 := extractFloat64Frac0( a );
			
 
				+    aExp := extractFloat64Exp( a );
			
 
				+    bSig1 := extractFloat64Frac1( b );
			
 
				+    bSig0 := extractFloat64Frac0( b );
			
 
				+    bExp := extractFloat64Exp( b );
			
 
				+    expDiff := aExp - bExp;
			
 
				+    if ( 0 < expDiff ) then
			
 
				+    Begin
			
 
				+        if ( aExp = $7FF ) then
			
 
				+        Begin
			
 
				+            if ( aSig0 OR  aSig1 ) <> 0 then
			
 
				+            Begin
			
 
				+              propagateFloat64NaN( a, b, out );
			
 
				+              exit;
			
 
				+            end;
			
 
				+            out := a;
			
 
				+            exit;
			
 
				+        End;
			
 
				+        if ( bExp = 0 ) then
			
 
				+        Begin
			
 
				+            Dec(expDiff);
			
 
				+        End
			
 
				+        else
			
 
				+        Begin
			
 
				+            bSig0 := bSig0 or $00100000;
			
 
				+        End;
			
 
				+        shift64ExtraRightJamming(
			
 
				+            bSig0, bSig1, 0, expDiff, bSig0, bSig1, zSig2 );
			
 
				+        zExp := aExp;
			
 
				+    End
			
 
				+    else if ( expDiff < 0 ) then
			
 
				+    Begin
			
 
				+        if ( bExp = $7FF ) then
			
 
				+        Begin
			
 
				+            if ( bSig0 OR  bSig1 ) <> 0 then
			
 
				+            Begin
			
 
				+               propagateFloat64NaN( a, b, out );
			
 
				+               exit;
			
 
				+            End;
			
 
				+            packFloat64( zSign, $7FF, 0, 0, out );
			
 
				+        End;
			
 
				+        if ( aExp = 0 ) then
			
 
				+        Begin
			
 
				+            Inc(expDiff);
			
 
				+        End
			
 
				+        else
			
 
				+        Begin
			
 
				+            aSig0 := aSig0 or $00100000;
			
 
				+        End;
			
 
				+        shift64ExtraRightJamming(
			
 
				+            aSig0, aSig1, 0, - expDiff, aSig0, aSig1, zSig2 );
			
 
				+        zExp := bExp;
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        if ( aExp = $7FF ) then
			
 
				+        Begin
			
 
				+            if ( aSig0 OR  aSig1 OR  bSig0 OR  bSig1 ) <> 0 then
			
 
				+            Begin
			
 
				+                propagateFloat64NaN( a, b, out );
			
 
				+                exit;
			
 
				+            End;
			
 
				+            out := a;
			
 
				+            exit;
			
 
				+        End;
			
 
				+        add64( aSig0, aSig1, bSig0, bSig1, zSig0, zSig1 );
			
 
				+        if ( aExp = 0 ) then
			
 
				+        Begin
			
 
				+           packFloat64( zSign, 0, zSig0, zSig1, out );
			
 
				+           exit;
			
 
				+        End;
			
 
				+        zSig2 := 0;
			
 
				+        zSig0 := zSig0 or $00200000;
			
 
				+        zExp := aExp;
			
 
				+        goto shiftRight1;
			
 
				+    End;
			
 
				+    aSig0 := aSig0 or $00100000;
			
 
				+    add64( aSig0, aSig1, bSig0, bSig1, zSig0, zSig1 );
			
 
				+    Dec(zExp);
			
 
				+    if ( zSig0 < $00200000 ) then
			
 
				+       goto roundAndPack;
			
 
				+    Inc(zExp);
			
 
				+ shiftRight1:
			
 
				+    shift64ExtraRightJamming( zSig0, zSig1, zSig2, 1, zSig0, zSig1, zSig2 );
			
 
				+ roundAndPack:
			
 
				+    roundAndPackFloat64( zSign, zExp, zSig0, zSig1, zSig2, out );
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of subtracting the absolute values of the double-
			
 
				+precision floating-point values `a' and `b'.  If `zSign' is 1, the
			
 
				+difference is negated before being returned.  `zSign' is ignored if the
			
 
				+result is a NaN.  The subtraction is performed according to the IEC/IEEE
			
 
				+Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure subFloat64Sigs( a:float64; b: float64 ; zSign:flag; Var out: float64 );
			
 
				+Var
			
 
				+    aExp, bExp, zExp: int16;
			
 
				+    aSig0, aSig1, bSig0, bSig1, zSig0, zSig1: bits32;
			
 
				+    expDiff: int16;
			
 
				+    z: float64;
			
 
				+    label aExpBigger;
			
 
				+    label bExpBigger;
			
 
				+    label aBigger;
			
 
				+    label bBigger;
			
 
				+    label normalizeRoundAndPack;
			
 
				+Begin
			
 
				+    aSig1 := extractFloat64Frac1( a );
			
 
				+    aSig0 := extractFloat64Frac0( a );
			
 
				+    aExp := extractFloat64Exp( a );
			
 
				+    bSig1 := extractFloat64Frac1( b );
			
 
				+    bSig0 := extractFloat64Frac0( b );
			
 
				+    bExp := extractFloat64Exp( b );
			
 
				+    expDiff := aExp - bExp;
			
 
				+    shortShift64Left( aSig0, aSig1, 10, aSig0, aSig1 );
			
 
				+    shortShift64Left( bSig0, bSig1, 10, bSig0, bSig1 );
			
 
				+    if ( 0 < expDiff ) then goto aExpBigger;
			
 
				+    if ( expDiff < 0 ) then goto bExpBigger;
			
 
				+    if ( aExp = $7FF ) then
			
 
				+    Begin
			
 
				+        if ( aSig0 OR  aSig1 OR  bSig0 OR  bSig1 ) <> 0 then
			
 
				+        Begin
			
 
				+            propagateFloat64NaN( a, b, out );
			
 
				+            exit;
			
 
				+        End;
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        z.low := float64_default_nan_low;
			
 
				+        z.high := float64_default_nan_high;
			
 
				+        out := z;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( aExp = 0 ) then
			
 
				+    Begin
			
 
				+        aExp := 1;
			
 
				+        bExp := 1;
			
 
				+    End;
			
 
				+    if ( bSig0 < aSig0 ) then goto aBigger;
			
 
				+    if ( aSig0 < bSig0 ) then goto bBigger;
			
 
				+    if ( bSig1 < aSig1 ) then goto aBigger;
			
 
				+    if ( aSig1 < bSig1 ) then goto bBigger;
			
 
				+    packFloat64( flag(float_rounding_mode = float_round_down), 0, 0, 0 , out);
			
 
				+    exit;
			
 
				+ bExpBigger:
			
 
				+    if ( bExp = $7FF ) then
			
 
				+    Begin
			
 
				+        if ( bSig0 OR  bSig1 ) <> 0 then
			
 
				+        Begin
			
 
				+           propagateFloat64NaN( a, b, out );
			
 
				+           exit;
			
 
				+        End;
			
 
				+        packFloat64( zSign xor 1, $7FF, 0, 0, out );
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( aExp = 0 ) then
			
 
				+    Begin
			
 
				+        Inc(expDiff);
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        aSig0 := aSig0 or $40000000;
			
 
				+    End;
			
 
				+    shift64RightJamming( aSig0, aSig1, - expDiff, aSig0, aSig1 );
			
 
				+    bSig0 := bSig0 or $40000000;
			
 
				+ bBigger:
			
 
				+    sub64( bSig0, bSig1, aSig0, aSig1, zSig0, zSig1 );
			
 
				+    zExp := bExp;
			
 
				+    zSign := zSign xor 1;
			
 
				+    goto normalizeRoundAndPack;
			
 
				+ aExpBigger:
			
 
				+    if ( aExp = $7FF ) then
			
 
				+    Begin
			
 
				+        if ( aSig0 OR  aSig1 ) <> 0 then
			
 
				+        Begin
			
 
				+           propagateFloat64NaN( a, b, out );
			
 
				+           exit;
			
 
				+        End;
			
 
				+        out :=  a;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( bExp = 0 ) then
			
 
				+    Begin
			
 
				+        Dec(expDiff);
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        bSig0 := bSig0 or $40000000;
			
 
				+    End;
			
 
				+    shift64RightJamming( bSig0, bSig1, expDiff, bSig0, bSig1 );
			
 
				+    aSig0 := aSig0 or $40000000;
			
 
				+ aBigger:
			
 
				+    sub64( aSig0, aSig1, bSig0, bSig1, zSig0, zSig1 );
			
 
				+    zExp := aExp;
			
 
				+ normalizeRoundAndPack:
			
 
				+    Dec(zExp);
			
 
				+    normalizeRoundAndPackFloat64( zSign, zExp - 10, zSig0, zSig1, out );
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of adding the double-precision floating-point values `a'
			
 
				+and `b'.  The operation is performed according to the IEC/IEEE Standard for
			
 
				+Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_add( a: float64; b : float64; Var out : float64);
			
 
				+Var
			
 
				+    aSign, bSign: flag;
			
 
				+Begin
			
 
				+    aSign := extractFloat64Sign( a );
			
 
				+    bSign := extractFloat64Sign( b );
			
 
				+    if ( aSign = bSign ) then
			
 
				+    Begin
			
 
				+         addFloat64Sigs( a, b, aSign, out );
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        subFloat64Sigs( a, b, aSign, out );
			
 
				+    End;
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of subtracting the double-precision floating-point values
			
 
				+`a' and `b'.  The operation is performed according to the IEC/IEEE Standard
			
 
				+for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_sub(a: float64; b : float64; var out: float64);
			
 
				+Var
			
 
				+    aSign, bSign: flag;
			
 
				+Begin
			
 
				+    aSign := extractFloat64Sign( a );
			
 
				+    bSign := extractFloat64Sign( b );
			
 
				+    if ( aSign = bSign ) then
			
 
				+    Begin
			
 
				+        subFloat64Sigs( a, b, aSign, out );
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        addFloat64Sigs( a, b, aSign, out );
			
 
				+    End;
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of multiplying the double-precision floating-point values
			
 
				+`a' and `b'.  The operation is performed according to the IEC/IEEE Standard
			
 
				+for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_mul( a: float64; b:float64; Var out: float64);
			
 
				+Var
			
 
				+    aSign, bSign, zSign: flag;
			
 
				+    aExp, bExp, zExp: int16;
			
 
				+    aSig0, aSig1, bSig0, bSig1, zSig0, zSig1, zSig2, zSig3: bits32;
			
 
				+    z: float64;
			
 
				+    label invalid;
			
 
				+Begin
			
 
				+    aSig1 := extractFloat64Frac1( a );
			
 
				+    aSig0 := extractFloat64Frac0( a );
			
 
				+    aExp := extractFloat64Exp( a );
			
 
				+    aSign := extractFloat64Sign( a );
			
 
				+    bSig1 := extractFloat64Frac1( b );
			
 
				+    bSig0 := extractFloat64Frac0( b );
			
 
				+    bExp := extractFloat64Exp( b );
			
 
				+    bSign := extractFloat64Sign( b );
			
 
				+    zSign := aSign xor bSign;
			
 
				+    if ( aExp = $7FF ) then
			
 
				+    Begin
			
 
				+        if (    (( aSig0 OR  aSig1 ) <>0)
			
 
				+             OR ( ( bExp = $7FF ) AND  (( bSig0 OR  bSig1 )<>0) ) ) then
			
 
				+        Begin
			
 
				+            propagateFloat64NaN( a, b, out );
			
 
				+            exit;
			
 
				+        End;
			
 
				+        if ( ( bExp OR  bSig0 OR  bSig1 ) = 0 ) then goto invalid;
			
 
				+        packFloat64( zSign, $7FF, 0, 0, out );
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( bExp = $7FF ) then
			
 
				+    Begin
			
 
				+        if ( bSig0 OR  bSig1 )<> 0 then
			
 
				+        Begin
			
 
				+          propagateFloat64NaN( a, b, out );
			
 
				+          exit;
			
 
				+        End;
			
 
				+        if ( ( aExp OR  aSig0 OR  aSig1 ) = 0 ) then
			
 
				+        Begin
			
 
				+ invalid:
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            z.low := float64_default_nan_low;
			
 
				+            z.high := float64_default_nan_high;
			
 
				+            out := z;
			
 
				+            exit;
			
 
				+        End;
			
 
				+        packFloat64( zSign, $7FF, 0, 0, out );
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( aExp = 0 ) then
			
 
				+    Begin
			
 
				+        if ( ( aSig0 OR  aSig1 ) = 0 ) then
			
 
				+        Begin
			
 
				+           packFloat64( zSign, 0, 0, 0, out );
			
 
				+           exit;
			
 
				+        End;
			
 
				+        normalizeFloat64Subnormal( aSig0, aSig1, aExp, aSig0, aSig1 );
			
 
				+    End;
			
 
				+    if ( bExp = 0 ) then
			
 
				+    Begin
			
 
				+        if ( ( bSig0 OR  bSig1 ) = 0 ) then
			
 
				+        Begin
			
 
				+          packFloat64( zSign, 0, 0, 0, out );
			
 
				+          exit;
			
 
				+        End;
			
 
				+        normalizeFloat64Subnormal( bSig0, bSig1, bExp, bSig0, bSig1 );
			
 
				+    End;
			
 
				+    zExp := aExp + bExp - $400;
			
 
				+    aSig0 := aSig0 or $00100000;
			
 
				+    shortShift64Left( bSig0, bSig1, 12, bSig0, bSig1 );
			
 
				+    mul64To128( aSig0, aSig1, bSig0, bSig1, zSig0, zSig1, zSig2, zSig3 );
			
 
				+    add64( zSig0, zSig1, aSig0, aSig1, zSig0, zSig1 );
			
 
				+    zSig2 := zSig2 or flag( zSig3 <> 0 );
			
 
				+    if ( $00200000 <= zSig0 ) then
			
 
				+    Begin
			
 
				+        shift64ExtraRightJamming(
			
 
				+            zSig0, zSig1, zSig2, 1, zSig0, zSig1, zSig2 );
			
 
				+        Inc(zExp);
			
 
				+    End;
			
 
				+    roundAndPackFloat64( zSign, zExp, zSig0, zSig1, zSig2, out );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the result of dividing the double-precision floating-point value `a'
			
 
				+by the corresponding value `b'.  The operation is performed according to the
			
 
				+IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_div(a: float64; b : float64 ; var out: float64 );
			
 
				+Var
			
 
				+    aSign, bSign, zSign: flag;
			
 
				+    aExp, bExp, zExp: int16;
			
 
				+    aSig0, aSig1, bSig0, bSig1, zSig0, zSig1, zSig2: bits32;
			
 
				+    rem0, rem1, rem2, rem3, term0, term1, term2, term3: bits32;
			
 
				+    z: float64;
			
 
				+    label invalid;
			
 
				+Begin
			
 
				+    aSig1 := extractFloat64Frac1( a );
			
 
				+    aSig0 := extractFloat64Frac0( a );
			
 
				+    aExp := extractFloat64Exp( a );
			
 
				+    aSign := extractFloat64Sign( a );
			
 
				+    bSig1 := extractFloat64Frac1( b );
			
 
				+    bSig0 := extractFloat64Frac0( b );
			
 
				+    bExp := extractFloat64Exp( b );
			
 
				+    bSign := extractFloat64Sign( b );
			
 
				+    zSign := aSign xor bSign;
			
 
				+    if ( aExp = $7FF ) then
			
 
				+    Begin
			
 
				+        if ( aSig0 OR  aSig1 )<> 0 then
			
 
				+        Begin
			
 
				+           propagateFloat64NaN( a, b, out );
			
 
				+           exit;
			
 
				+        end;
			
 
				+        if ( bExp = $7FF ) then
			
 
				+        Begin
			
 
				+            if ( bSig0 OR  bSig1 )<>0 then
			
 
				+            Begin
			
 
				+               propagateFloat64NaN( a, b, out );
			
 
				+               exit;
			
 
				+            End;
			
 
				+            goto invalid;
			
 
				+        End;
			
 
				+        packFloat64( zSign, $7FF, 0, 0, out );
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( bExp = $7FF ) then
			
 
				+    Begin
			
 
				+        if ( bSig0 OR  bSig1 )<> 0 then
			
 
				+        Begin
			
 
				+          propagateFloat64NaN( a, b, out );
			
 
				+          exit;
			
 
				+        End;
			
 
				+        packFloat64( zSign, 0, 0, 0, out );
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( bExp = 0 ) then
			
 
				+    Begin
			
 
				+        if ( ( bSig0 OR  bSig1 ) = 0 ) then
			
 
				+        Begin
			
 
				+            if ( ( aExp OR  aSig0 OR  aSig1 ) = 0 ) then
			
 
				+            Begin
			
 
				+ invalid:
			
 
				+                float_raise( float_flag_invalid );
			
 
				+                z.low := float64_default_nan_low;
			
 
				+                z.high := float64_default_nan_high;
			
 
				+                out := z;
			
 
				+                exit;
			
 
				+            End;
			
 
				+            float_raise( float_flag_divbyzero );
			
 
				+            packFloat64( zSign, $7FF, 0, 0, out );
			
 
				+            exit;
			
 
				+        End;
			
 
				+        normalizeFloat64Subnormal( bSig0, bSig1, bExp, bSig0, bSig1 );
			
 
				+    End;
			
 
				+    if ( aExp = 0 ) then
			
 
				+    Begin
			
 
				+        if ( ( aSig0 OR  aSig1 ) = 0 ) then
			
 
				+        Begin
			
 
				+           packFloat64( zSign, 0, 0, 0, out );
			
 
				+           exit;
			
 
				+        End;
			
 
				+        normalizeFloat64Subnormal( aSig0, aSig1, aExp, aSig0, aSig1 );
			
 
				+    End;
			
 
				+    zExp := aExp - bExp + $3FD;
			
 
				+    shortShift64Left( aSig0 OR  $00100000, aSig1, 11, aSig0, aSig1 );
			
 
				+    shortShift64Left( bSig0 OR  $00100000, bSig1, 11, bSig0, bSig1 );
			
 
				+    if ( le64( bSig0, bSig1, aSig0, aSig1 )<>0 ) then
			
 
				+    Begin
			
 
				+        shift64Right( aSig0, aSig1, 1, aSig0, aSig1 );
			
 
				+        Inc(zExp);
			
 
				+    End;
			
 
				+    zSig0 := estimateDiv64To32( aSig0, aSig1, bSig0 );
			
 
				+    mul64By32To96( bSig0, bSig1, zSig0, term0, term1, term2 );
			
 
				+    sub96( aSig0, aSig1, 0, term0, term1, term2, rem0, rem1, rem2 );
			
 
				+    while ( sbits32 (rem0) < 0 ) do
			
 
				+    Begin
			
 
				+        Dec(zSig0);
			
 
				+        add96( rem0, rem1, rem2, 0, bSig0, bSig1, rem0, rem1, rem2 );
			
 
				+    End;
			
 
				+    zSig1 := estimateDiv64To32( rem1, rem2, bSig0 );
			
 
				+    if ( ( zSig1 and $3FF ) <= 4 ) then
			
 
				+    Begin
			
 
				+        mul64By32To96( bSig0, bSig1, zSig1, term1, term2, term3 );
			
 
				+        sub96( rem1, rem2, 0, term1, term2, term3, rem1, rem2, rem3 );
			
 
				+        while ( sbits32 (rem1) < 0 ) do
			
 
				+        Begin
			
 
				+            Dec(zSig1);
			
 
				+            add96( rem1, rem2, rem3, 0, bSig0, bSig1, rem1, rem2, rem3 );
			
 
				+        End;
			
 
				+        zSig1 := zSig1 or flag( ( rem1 OR  rem2 OR  rem3 ) <> 0 );
			
 
				+    End;
			
 
				+    shift64ExtraRightJamming( zSig0, zSig1, 0, 11, zSig0, zSig1, zSig2 );
			
 
				+    roundAndPackFloat64( zSign, zExp, zSig0, zSig1, zSig2, out );
			
 
				+
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the remainder of the double-precision floating-point value `a'
			
 
				+with respect to the corresponding value `b'.  The operation is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_rem(a: float64; b : float64; var out: float64);
			
 
				+Var
			
 
				+    aSign, bSign, zSign: flag;
			
 
				+    aExp, bExp, expDiff: int16;
			
 
				+    aSig0, aSig1, bSig0, bSig1, q, term0, term1, term2: bits32;
			
 
				+    allZero, alternateASig0, alternateASig1, sigMean1: bits32;
			
 
				+    sigMean0: sbits32;
			
 
				+    z: float64;
			
 
				+    label invalid;
			
 
				+Begin
			
 
				+    aSig1 := extractFloat64Frac1( a );
			
 
				+    aSig0 := extractFloat64Frac0( a );
			
 
				+    aExp := extractFloat64Exp( a );
			
 
				+    aSign := extractFloat64Sign( a );
			
 
				+    bSig1 := extractFloat64Frac1( b );
			
 
				+    bSig0 := extractFloat64Frac0( b );
			
 
				+    bExp := extractFloat64Exp( b );
			
 
				+    bSign := extractFloat64Sign( b );
			
 
				+    if ( aExp = $7FF ) then
			
 
				+    Begin
			
 
				+        if ((( aSig0 OR  aSig1 )<>0)
			
 
				+             OR ( ( bExp = $7FF ) AND  (( bSig0 OR  bSig1 )<>0) ) ) then
			
 
				+        Begin
			
 
				+            propagateFloat64NaN( a, b, out );
			
 
				+            exit;
			
 
				+        End;
			
 
				+        goto invalid;
			
 
				+    End;
			
 
				+    if ( bExp = $7FF ) then
			
 
				+    Begin
			
 
				+        if ( bSig0 OR  bSig1 ) <> 0 then
			
 
				+        Begin
			
 
				+          propagateFloat64NaN( a, b, out );
			
 
				+          exit;
			
 
				+        End;
			
 
				+        out := a;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( bExp = 0 ) then
			
 
				+    Begin
			
 
				+        if ( ( bSig0 OR  bSig1 ) = 0 ) then
			
 
				+        Begin
			
 
				+ invalid:
			
 
				+            float_raise( float_flag_invalid );
			
 
				+            z.low := float64_default_nan_low;
			
 
				+            z.high := float64_default_nan_high;
			
 
				+            out := z;
			
 
				+            exit;
			
 
				+        End;
			
 
				+        normalizeFloat64Subnormal( bSig0, bSig1, bExp, bSig0, bSig1 );
			
 
				+    End;
			
 
				+    if ( aExp = 0 ) then
			
 
				+    Begin
			
 
				+        if ( ( aSig0 OR  aSig1 ) = 0 ) then
			
 
				+        Begin
			
 
				+           out := a;
			
 
				+           exit;
			
 
				+        End;
			
 
				+        normalizeFloat64Subnormal( aSig0, aSig1, aExp, aSig0, aSig1 );
			
 
				+    End;
			
 
				+    expDiff := aExp - bExp;
			
 
				+    if ( expDiff < -1 ) then
			
 
				+    Begin
			
 
				+       out := a;
			
 
				+       exit;
			
 
				+    End;
			
 
				+    shortShift64Left(
			
 
				+        aSig0 OR  $00100000, aSig1, 11 - flag( expDiff < 0 ), aSig0, aSig1 );
			
 
				+    shortShift64Left( bSig0 OR  $00100000, bSig1, 11, bSig0, bSig1 );
			
 
				+    q := le64( bSig0, bSig1, aSig0, aSig1 );
			
 
				+    if ( q )<>0 then
			
 
				+       sub64( aSig0, aSig1, bSig0, bSig1, aSig0, aSig1 );
			
 
				+    expDiff := expDiff - 32;
			
 
				+    while ( 0 < expDiff ) do
			
 
				+    Begin
			
 
				+        q := estimateDiv64To32( aSig0, aSig1, bSig0 );
			
 
				+        if 4 < q then
			
 
				+          q:= q - 4
			
 
				+        else
			
 
				+          q := 0;
			
 
				+        mul64By32To96( bSig0, bSig1, q, term0, term1, term2 );
			
 
				+        shortShift96Left( term0, term1, term2, 29, term1, term2, allZero );
			
 
				+        shortShift64Left( aSig0, aSig1, 29, aSig0, allZero );
			
 
				+        sub64( aSig0, 0, term1, term2, aSig0, aSig1 );
			
 
				+        expDiff := expDiff - 29;
			
 
				+    End;
			
 
				+    if ( -32 < expDiff ) then
			
 
				+    Begin
			
 
				+        q := estimateDiv64To32( aSig0, aSig1, bSig0 );
			
 
				+        if 4 < q then
			
 
				+          q := q - 4
			
 
				+        else
			
 
				+          q := 0;
			
 
				+        q := q shr (- expDiff);
			
 
				+        shift64Right( bSig0, bSig1, 8, bSig0, bSig1 );
			
 
				+        expDiff := expDiff + 24;
			
 
				+        if ( expDiff < 0 ) then
			
 
				+        Begin
			
 
				+            shift64Right( aSig0, aSig1, - expDiff, aSig0, aSig1 );
			
 
				+        End
			
 
				+        else
			
 
				+        Begin
			
 
				+            shortShift64Left( aSig0, aSig1, expDiff, aSig0, aSig1 );
			
 
				+        End;
			
 
				+        mul64By32To96( bSig0, bSig1, q, term0, term1, term2 );
			
 
				+        sub64( aSig0, aSig1, term1, term2, aSig0, aSig1 );
			
 
				+    End
			
 
				+    else
			
 
				+    Begin
			
 
				+        shift64Right( aSig0, aSig1, 8, aSig0, aSig1 );
			
 
				+        shift64Right( bSig0, bSig1, 8, bSig0, bSig1 );
			
 
				+    End;
			
 
				+    Repeat
			
 
				+        alternateASig0 := aSig0;
			
 
				+        alternateASig1 := aSig1;
			
 
				+        Inc(q);
			
 
				+        sub64( aSig0, aSig1, bSig0, bSig1, aSig0, aSig1 );
			
 
				+    Until not ( 0 <= sbits32 (aSig0) );
			
 
				+    add64(
			
 
				+        aSig0, aSig1, alternateASig0, alternateASig1, sigMean0, sigMean1 );
			
 
				+    if (    ( sigMean0 < 0 )
			
 
				+         OR ( ( ( sigMean0 OR  sigMean1 ) = 0 ) AND  (( q AND 1 )<>0) ) ) then
			
 
				+    Begin
			
 
				+        aSig0 := alternateASig0;
			
 
				+        aSig1 := alternateASig1;
			
 
				+    End;
			
 
				+    zSign := flag( sbits32 (aSig0) < 0 );
			
 
				+    if ( zSign <> 0 ) then
			
 
				+       sub64( 0, 0, aSig0, aSig1, aSig0, aSig1 );
			
 
				+    normalizeRoundAndPackFloat64( aSign xor zSign, bExp - 4, aSig0, aSig1, out );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns the square root of the double-precision floating-point value `a'.
			
 
				+The operation is performed according to the IEC/IEEE Standard for Binary
			
 
				+Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Procedure float64_sqrt( a: float64; var out: float64 );
			
 
				+Var
			
 
				+    aSign: flag;
			
 
				+    aExp, zExp: int16;
			
 
				+    aSig0, aSig1, zSig0, zSig1, zSig2, doubleZSig0: bits32;
			
 
				+    rem0, rem1, rem2, rem3, term0, term1, term2, term3: bits32;
			
 
				+    z: float64;
			
 
				+    label invalid;
			
 
				+Begin
			
 
				+    aSig1 := extractFloat64Frac1( a );
			
 
				+    aSig0 := extractFloat64Frac0( a );
			
 
				+    aExp := extractFloat64Exp( a );
			
 
				+    aSign := extractFloat64Sign( a );
			
 
				+    if ( aExp = $7FF ) then
			
 
				+    Begin
			
 
				+        if ( aSig0 OR  aSig1 ) <> 0 then
			
 
				+        Begin
			
 
				+           propagateFloat64NaN( a, a, out );
			
 
				+           exit;
			
 
				+        End;
			
 
				+        if ( aSign = 0) then
			
 
				+        Begin
			
 
				+          out := a;
			
 
				+          exit;
			
 
				+        End;
			
 
				+        goto invalid;
			
 
				+    End;
			
 
				+    if ( aSign <> 0 ) then
			
 
				+    Begin
			
 
				+        if ( ( aExp OR  aSig0 OR  aSig1 ) = 0 ) then
			
 
				+        Begin
			
 
				+           out := a;
			
 
				+           exit;
			
 
				+        End;
			
 
				+ invalid:
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        z.low := float64_default_nan_low;
			
 
				+        z.high := float64_default_nan_high;
			
 
				+        out := z;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if ( aExp = 0 ) then
			
 
				+    Begin
			
 
				+        if ( ( aSig0 OR  aSig1 ) = 0 ) then
			
 
				+        Begin
			
 
				+           packFloat64( 0, 0, 0, 0, out );
			
 
				+           exit;
			
 
				+        End;
			
 
				+        normalizeFloat64Subnormal( aSig0, aSig1, aExp, aSig0, aSig1 );
			
 
				+    End;
			
 
				+    zExp := ( ( aExp - $3FF ) shr 1 ) + $3FE;
			
 
				+    aSig0 := aSig0 or $00100000;
			
 
				+    shortShift64Left( aSig0, aSig1, 11, term0, term1 );
			
 
				+    zSig0 := ( estimateSqrt32( aExp, term0 ) shr 1 ) + 1;
			
 
				+    if ( zSig0 = 0 ) then
			
 
				+       zSig0 := $7FFFFFFF;
			
 
				+    doubleZSig0 := zSig0 + zSig0;
			
 
				+    shortShift64Left( aSig0, aSig1, 9 - ( aExp and 1 ), aSig0, aSig1 );
			
 
				+    mul32To64( zSig0, zSig0, term0, term1 );
			
 
				+    sub64( aSig0, aSig1, term0, term1, rem0, rem1 );
			
 
				+    while ( sbits32 (rem0) < 0 ) do
			
 
				+    Begin
			
 
				+        Dec(zSig0);
			
 
				+        doubleZSig0 := doubleZSig0 - 2;
			
 
				+        add64( rem0, rem1, 0, doubleZSig0 OR  1, rem0, rem1 );
			
 
				+    End;
			
 
				+    zSig1 := estimateDiv64To32( rem1, 0, doubleZSig0 );
			
 
				+    if ( ( zSig1 and $1FF ) <= 5 ) then
			
 
				+    Begin
			
 
				+        if ( zSig1 = 0 ) then
			
 
				+           zSig1 := 1;
			
 
				+        mul32To64( doubleZSig0, zSig1, term1, term2 );
			
 
				+        sub64( rem1, 0, term1, term2, rem1, rem2 );
			
 
				+        mul32To64( zSig1, zSig1, term2, term3 );
			
 
				+        sub96( rem1, rem2, 0, 0, term2, term3, rem1, rem2, rem3 );
			
 
				+        while ( sbits32 (rem1) < 0 ) do
			
 
				+        Begin
			
 
				+            Dec(zSig1);
			
 
				+            shortShift64Left( 0, zSig1, 1, term2, term3 );
			
 
				+            term3 := term3 or 1;
			
 
				+            term2 := term2 or doubleZSig0;
			
 
				+            add96( rem1, rem2, rem3, 0, term2, term3, rem1, rem2, rem3 );
			
 
				+        End;
			
 
				+        zSig1 := zSig1 or bits32( ( rem1 OR  rem2 OR  rem3 ) <> 0 );
			
 
				+    End;
			
 
				+    shift64ExtraRightJamming( zSig0, zSig1, 0, 10, zSig0, zSig1, zSig2 );
			
 
				+    roundAndPackFloat64( 0, zExp, zSig0, zSig1, zSig2, out );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the double-precision floating-point value `a' is equal to
			
 
				+the corresponding value `b', and 0 otherwise.  The comparison is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_eq(a: float64; b: float64): flag;
			
 
				+Begin
			
 
				+    if
			
 
				+         (
			
 
				+                ( extractFloat64Exp( a ) = $7FF )
			
 
				+            AND
			
 
				+                (
			
 
				+                    (extractFloat64Frac0( a )  OR  extractFloat64Frac1( a )) <>0
			
 
				+                )
			
 
				+         )
			
 
				+         OR (
			
 
				+                ( extractFloat64Exp( b ) = $7FF )
			
 
				+           AND  (
			
 
				+                    (extractFloat64Frac0( b ) OR  (extractFloat64Frac1( b )) <> 0
			
 
				+                )
			
 
				+           )
			
 
				+       ) then
			
 
				+    Begin
			
 
				+        if ( (float64_is_signaling_nan( a )<>0) OR (float64_is_signaling_nan( b )<>0) ) then
			
 
				+            float_raise( float_flag_invalid );
			
 
				+        float64_eq := 0;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    float64_eq := flag(
			
 
				+           ( a.low = b.low )
			
 
				+        AND  (    ( a.high = b.high )
			
 
				+             OR (    ( a.low = 0 )
			
 
				+                  AND  ( bits32 ( ( a.high OR  b.high ) shl 1 ) = 0 ) )
			
 
				+           ));
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the double-precision floating-point value `a' is less than
			
 
				+or equal to the corresponding value `b', and 0 otherwise.  The comparison
			
 
				+is performed according to the IEC/IEEE Standard for Binary Floating-Point
			
 
				+Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_le(a: float64;b: float64): flag;
			
 
				+Var
			
 
				+    aSign, bSign: flag;
			
 
				+Begin
			
 
				+    if
			
 
				+         (
			
 
				+                ( extractFloat64Exp( a ) = $7FF )
			
 
				+            AND
			
 
				+                (
			
 
				+                    (extractFloat64Frac0( a )  OR  extractFloat64Frac1( a )) <>0
			
 
				+                )
			
 
				+         )
			
 
				+         OR (
			
 
				+                ( extractFloat64Exp( b ) = $7FF )
			
 
				+           AND  (
			
 
				+                    (extractFloat64Frac0( b ) OR  (extractFloat64Frac1( b )) <> 0
			
 
				+                )
			
 
				+           )
			
 
				+       ) then
			
 
				+    Begin
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        float64_le := 0;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    aSign := extractFloat64Sign( a );
			
 
				+    bSign := extractFloat64Sign( b );
			
 
				+    if ( aSign <> bSign ) then
			
 
				+    Begin
			
 
				+        float64_le := flag(
			
 
				+               (aSign <> 0)
			
 
				+            OR (    ( ( bits32 ( ( a.high OR  b.high ) shl 1 ) ) OR  a.low OR  b.low )
			
 
				+                 = 0 ));
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if aSign <> 0 then
			
 
				+      float64_le := le64( b.high, b.low, a.high, a.low )
			
 
				+    else
			
 
				+      float64_le := le64( a.high, a.low, b.high, b.low );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the double-precision floating-point value `a' is less than
			
 
				+the corresponding value `b', and 0 otherwise.  The comparison is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_lt(a: float64;b: float64): flag;
			
 
				+Var
			
 
				+    aSign, bSign: flag;
			
 
				+Begin
			
 
				+    if
			
 
				+         (
			
 
				+                ( extractFloat64Exp( a ) = $7FF )
			
 
				+            AND
			
 
				+                (
			
 
				+                    (extractFloat64Frac0( a )  OR  extractFloat64Frac1( a )) <>0
			
 
				+                )
			
 
				+         )
			
 
				+         OR (
			
 
				+                ( extractFloat64Exp( b ) = $7FF )
			
 
				+           AND  (
			
 
				+                    (extractFloat64Frac0( b ) OR  (extractFloat64Frac1( b )) <> 0
			
 
				+                )
			
 
				+           )
			
 
				+       ) then
			
 
				+    Begin
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        float64_lt := 0;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    aSign := extractFloat64Sign( a );
			
 
				+    bSign := extractFloat64Sign( b );
			
 
				+    if ( aSign <> bSign ) then
			
 
				+    Begin
			
 
				+        float64_lt := flag(
			
 
				+               (aSign <> 0)
			
 
				+            AND  (    ( ( bits32 ( ( a.high OR  b.high ) shl 1 ) ) OR  a.low OR  b.low )
			
 
				+                 <> 0 ));
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if aSign <> 0 then
			
 
				+       float64_lt := lt64( b.high, b.low, a.high, a.low )
			
 
				+    else
			
 
				+       float64_lt := lt64( a.high, a.low, b.high, b.low );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the double-precision floating-point value `a' is equal to
			
 
				+the corresponding value `b', and 0 otherwise.  The invalid exception is
			
 
				+raised if either operand is a NaN.  Otherwise, the comparison is performed
			
 
				+according to the IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_eq_signaling( a: float64; b: float64): flag;
			
 
				+Begin
			
 
				+
			
 
				+    if
			
 
				+         (
			
 
				+                ( extractFloat64Exp( a ) = $7FF )
			
 
				+            AND
			
 
				+                (
			
 
				+                    (extractFloat64Frac0( a )  OR  extractFloat64Frac1( a )) <>0
			
 
				+                )
			
 
				+         )
			
 
				+         OR (
			
 
				+                ( extractFloat64Exp( b ) = $7FF )
			
 
				+           AND  (
			
 
				+                    (extractFloat64Frac0( b ) OR  (extractFloat64Frac1( b )) <> 0
			
 
				+                )
			
 
				+           )
			
 
				+       ) then
			
 
				+    Begin
			
 
				+        float_raise( float_flag_invalid );
			
 
				+        float64_eq_signaling := 0;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    float64_eq_signaling := flag(
			
 
				+           ( a.low = b.low )
			
 
				+        AND  (    ( a.high = b.high )
			
 
				+             OR (    ( a.low = 0 )
			
 
				+                  AND  ( bits32 ( ( a.high OR  b.high ) shl 1 ) = 0 ) )
			
 
				+           ));
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the double-precision floating-point value `a' is less than or
			
 
				+equal to the corresponding value `b', and 0 otherwise.  Quiet NaNs do not
			
 
				+cause an exception.  Otherwise, the comparison is performed according to the
			
 
				+IEC/IEEE Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_le_quiet(a: float64 ; b: float64 ): flag;
			
 
				+Var
			
 
				+    aSign, bSign : flag;
			
 
				+Begin
			
 
				+    if
			
 
				+         (
			
 
				+                ( extractFloat64Exp( a ) = $7FF )
			
 
				+            AND
			
 
				+                (
			
 
				+                    (extractFloat64Frac0( a )  OR  extractFloat64Frac1( a )) <>0
			
 
				+                )
			
 
				+         )
			
 
				+         OR (
			
 
				+                ( extractFloat64Exp( b ) = $7FF )
			
 
				+           AND  (
			
 
				+                    (extractFloat64Frac0( b ) OR  (extractFloat64Frac1( b )) <> 0
			
 
				+                )
			
 
				+           )
			
 
				+       ) then
			
 
				+    Begin
			
 
				+        if ( (float64_is_signaling_nan( a )<>0)  OR (float64_is_signaling_nan( b )<>0) ) then
			
 
				+            float_raise( float_flag_invalid );
			
 
				+        float64_le_quiet := 0;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    aSign := extractFloat64Sign( a );
			
 
				+    bSign := extractFloat64Sign( b );
			
 
				+    if ( aSign <> bSign ) then
			
 
				+    Begin
			
 
				+     float64_le_quiet := flag
			
 
				+      ((aSign <> 0)
			
 
				+            OR (    ( ( bits32 ( ( a.high OR  b.high ) shl 1 ) ) OR  a.low OR  b.low )
			
 
				+                 = 0 ));
			
 
				+        exit;
			
 
				+    End;
			
 
				+    if aSign <> 0 then
			
 
				+      float64_le_quiet := le64( b.high, b.low, a.high, a.low )
			
 
				+    else
			
 
				+      float64_le_quiet := le64( a.high, a.low, b.high, b.low );
			
 
				+End;
			
 
				+
			
 
				+{*
			
 
				+-------------------------------------------------------------------------------
			
 
				+Returns 1 if the double-precision floating-point value `a' is less than
			
 
				+the corresponding value `b', and 0 otherwise.  Quiet NaNs do not cause an
			
 
				+exception.  Otherwise, the comparison is performed according to the IEC/IEEE
			
 
				+Standard for Binary Floating-Point Arithmetic.
			
 
				+-------------------------------------------------------------------------------
			
 
				+*}
			
 
				+Function float64_lt_quiet(a: float64; b: float64 ): Flag;
			
 
				+Var
			
 
				+    aSign, bSign: flag;
			
 
				+Begin
			
 
				+    if
			
 
				+         (
			
 
				+                ( extractFloat64Exp( a ) = $7FF )
			
 
				+            AND
			
 
				+                (
			
 
				+                    (extractFloat64Frac0( a )  OR  extractFloat64Frac1( a )) <>0
			
 
				+                )
			
 
				+         )
			
 
				+         OR (
			
 
				+                ( extractFloat64Exp( b ) = $7FF )
			
 
				+           AND  (
			
 
				+                    (extractFloat64Frac0( b ) OR  (extractFloat64Frac1( b )) <> 0
			
 
				+                )
			
 
				+           )
			
 
				+       ) then
			
 
				+    Begin
			
 
				+        if ( (float64_is_signaling_nan( a )<>0) OR (float64_is_signaling_nan( b )<>0) ) then
			
 
				+            float_raise( float_flag_invalid );
			
 
				+        float64_lt_quiet := 0;
			
 
				+        exit;
			
 
				+    End;
			
 
				+    aSign := extractFloat64Sign( a );
			
 
				+    bSign := extractFloat64Sign( b );
			
 
				+    if ( aSign <> bSign ) then
			
 
				+    Begin
			
 
				+      float64_lt_quiet := flag(
			
 
				+               (aSign<>0)
			
 
				+            AND  (    ( ( bits32 ( ( a.high OR  b.high ) shl 1 ) ) OR  a.low OR  b.low )
			
 
				+                 <> 0 ));
			
 
				+        exit;
			
 
				+    End;
			
 
				+    If aSign <> 0 then
			
 
				+      float64_lt_quiet :=  lt64( b.high, b.low, a.high, a.low )
			
 
				+    else
			
 
				+      float64_lt_quiet := lt64( a.high, a.low, b.high, b.low );
			
 
				+End;
			
 
				+
			
 
				+end.
			
 
				+{
			
 
				+   $Log$
			
 
				+   Revision 1.1  2002-09-16 19:10:17  carl
			
 
				+     * first revision of FPU emulation
			
 
				+
			
 
				+}