123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447 |
- {
- File: vecLib/vBLAS.h
-
- Contains: Header for the Basic Linear Algebra Subprograms, with Apple extensions.
-
- Version: vecLib-$(vDSP_Version0).$(vDSP_Version1)
-
- Copyright: © 2000-$(Year) by Apple Computer, Inc., all rights reserved.
-
- Bugs?: For bug reports, consult the following page on
- the World Wide Web:
-
- http://bugs.freepascal.org
-
- }
- { Pascal Translation Updated: Jonas Maebe, <[email protected]>, October 2009 }
- { Pascal Translation Updated: Jonas Maebe, <[email protected]>, October 2012 }
- {
- Modified for use with Free Pascal
- Version 308
- Please report any bugs to <[email protected]>
- }
- {$ifc not defined MACOSALLINCLUDE or not MACOSALLINCLUDE}
- {$mode macpas}
- {$modeswitch cblocks}
- {$packenum 1}
- {$macro on}
- {$inline on}
- {$calling mwpascal}
- unit vBLAS;
- interface
- {$setc UNIVERSAL_INTERFACES_VERSION := $0400}
- {$setc GAP_INTERFACES_VERSION := $0308}
- {$ifc not defined USE_CFSTR_CONSTANT_MACROS}
- {$setc USE_CFSTR_CONSTANT_MACROS := TRUE}
- {$endc}
- {$ifc defined CPUPOWERPC and defined CPUI386}
- {$error Conflicting initial definitions for CPUPOWERPC and CPUI386}
- {$endc}
- {$ifc defined FPC_BIG_ENDIAN and defined FPC_LITTLE_ENDIAN}
- {$error Conflicting initial definitions for FPC_BIG_ENDIAN and FPC_LITTLE_ENDIAN}
- {$endc}
- {$ifc not defined __ppc__ and defined CPUPOWERPC32}
- {$setc __ppc__ := 1}
- {$elsec}
- {$setc __ppc__ := 0}
- {$endc}
- {$ifc not defined __ppc64__ and defined CPUPOWERPC64}
- {$setc __ppc64__ := 1}
- {$elsec}
- {$setc __ppc64__ := 0}
- {$endc}
- {$ifc not defined __i386__ and defined CPUI386}
- {$setc __i386__ := 1}
- {$elsec}
- {$setc __i386__ := 0}
- {$endc}
- {$ifc not defined __x86_64__ and defined CPUX86_64}
- {$setc __x86_64__ := 1}
- {$elsec}
- {$setc __x86_64__ := 0}
- {$endc}
- {$ifc not defined __arm__ and defined CPUARM}
- {$setc __arm__ := 1}
- {$elsec}
- {$setc __arm__ := 0}
- {$endc}
- {$ifc not defined __arm64__ and defined CPUAARCH64}
- {$setc __arm64__ := 1}
- {$elsec}
- {$setc __arm64__ := 0}
- {$endc}
- {$ifc defined cpu64}
- {$setc __LP64__ := 1}
- {$elsec}
- {$setc __LP64__ := 0}
- {$endc}
- {$ifc defined __ppc__ and __ppc__ and defined __i386__ and __i386__}
- {$error Conflicting definitions for __ppc__ and __i386__}
- {$endc}
- {$ifc defined __ppc__ and __ppc__}
- {$setc TARGET_CPU_PPC := TRUE}
- {$setc TARGET_CPU_PPC64 := FALSE}
- {$setc TARGET_CPU_X86 := FALSE}
- {$setc TARGET_CPU_X86_64 := FALSE}
- {$setc TARGET_CPU_ARM := FALSE}
- {$setc TARGET_CPU_ARM64 := FALSE}
- {$setc TARGET_OS_MAC := TRUE}
- {$setc TARGET_OS_IPHONE := FALSE}
- {$setc TARGET_IPHONE_SIMULATOR := FALSE}
- {$setc TARGET_OS_EMBEDDED := FALSE}
- {$elifc defined __ppc64__ and __ppc64__}
- {$setc TARGET_CPU_PPC := FALSE}
- {$setc TARGET_CPU_PPC64 := TRUE}
- {$setc TARGET_CPU_X86 := FALSE}
- {$setc TARGET_CPU_X86_64 := FALSE}
- {$setc TARGET_CPU_ARM := FALSE}
- {$setc TARGET_CPU_ARM64 := FALSE}
- {$setc TARGET_OS_MAC := TRUE}
- {$setc TARGET_OS_IPHONE := FALSE}
- {$setc TARGET_IPHONE_SIMULATOR := FALSE}
- {$setc TARGET_OS_EMBEDDED := FALSE}
- {$elifc defined __i386__ and __i386__}
- {$setc TARGET_CPU_PPC := FALSE}
- {$setc TARGET_CPU_PPC64 := FALSE}
- {$setc TARGET_CPU_X86 := TRUE}
- {$setc TARGET_CPU_X86_64 := FALSE}
- {$setc TARGET_CPU_ARM := FALSE}
- {$setc TARGET_CPU_ARM64 := FALSE}
- {$ifc defined iphonesim}
- {$setc TARGET_OS_MAC := FALSE}
- {$setc TARGET_OS_IPHONE := TRUE}
- {$setc TARGET_IPHONE_SIMULATOR := TRUE}
- {$elsec}
- {$setc TARGET_OS_MAC := TRUE}
- {$setc TARGET_OS_IPHONE := FALSE}
- {$setc TARGET_IPHONE_SIMULATOR := FALSE}
- {$endc}
- {$setc TARGET_OS_EMBEDDED := FALSE}
- {$elifc defined __x86_64__ and __x86_64__}
- {$setc TARGET_CPU_PPC := FALSE}
- {$setc TARGET_CPU_PPC64 := FALSE}
- {$setc TARGET_CPU_X86 := FALSE}
- {$setc TARGET_CPU_X86_64 := TRUE}
- {$setc TARGET_CPU_ARM := FALSE}
- {$setc TARGET_CPU_ARM64 := FALSE}
- {$ifc defined iphonesim}
- {$setc TARGET_OS_MAC := FALSE}
- {$setc TARGET_OS_IPHONE := TRUE}
- {$setc TARGET_IPHONE_SIMULATOR := TRUE}
- {$elsec}
- {$setc TARGET_OS_MAC := TRUE}
- {$setc TARGET_OS_IPHONE := FALSE}
- {$setc TARGET_IPHONE_SIMULATOR := FALSE}
- {$endc}
- {$setc TARGET_OS_EMBEDDED := FALSE}
- {$elifc defined __arm__ and __arm__}
- {$setc TARGET_CPU_PPC := FALSE}
- {$setc TARGET_CPU_PPC64 := FALSE}
- {$setc TARGET_CPU_X86 := FALSE}
- {$setc TARGET_CPU_X86_64 := FALSE}
- {$setc TARGET_CPU_ARM := TRUE}
- {$setc TARGET_CPU_ARM64 := FALSE}
- {$setc TARGET_OS_MAC := FALSE}
- {$setc TARGET_OS_IPHONE := TRUE}
- {$setc TARGET_IPHONE_SIMULATOR := FALSE}
- {$setc TARGET_OS_EMBEDDED := TRUE}
- {$elifc defined __arm64__ and __arm64__}
- {$setc TARGET_CPU_PPC := FALSE}
- {$setc TARGET_CPU_PPC64 := FALSE}
- {$setc TARGET_CPU_X86 := FALSE}
- {$setc TARGET_CPU_X86_64 := FALSE}
- {$setc TARGET_CPU_ARM := FALSE}
- {$setc TARGET_CPU_ARM64 := TRUE}
- {$ifc defined ios}
- {$setc TARGET_OS_MAC := FALSE}
- {$setc TARGET_OS_IPHONE := TRUE}
- {$setc TARGET_OS_EMBEDDED := TRUE}
- {$elsec}
- {$setc TARGET_OS_MAC := TRUE}
- {$setc TARGET_OS_IPHONE := FALSE}
- {$setc TARGET_OS_EMBEDDED := FALSE}
- {$endc}
- {$setc TARGET_IPHONE_SIMULATOR := FALSE}
- {$elsec}
- {$error __ppc__ nor __ppc64__ nor __i386__ nor __x86_64__ nor __arm__ nor __arm64__ is defined.}
- {$endc}
- {$ifc defined __LP64__ and __LP64__ }
- {$setc TARGET_CPU_64 := TRUE}
- {$elsec}
- {$setc TARGET_CPU_64 := FALSE}
- {$endc}
- {$ifc defined FPC_BIG_ENDIAN}
- {$setc TARGET_RT_BIG_ENDIAN := TRUE}
- {$setc TARGET_RT_LITTLE_ENDIAN := FALSE}
- {$elifc defined FPC_LITTLE_ENDIAN}
- {$setc TARGET_RT_BIG_ENDIAN := FALSE}
- {$setc TARGET_RT_LITTLE_ENDIAN := TRUE}
- {$elsec}
- {$error Neither FPC_BIG_ENDIAN nor FPC_LITTLE_ENDIAN are defined.}
- {$endc}
- {$setc ACCESSOR_CALLS_ARE_FUNCTIONS := TRUE}
- {$setc CALL_NOT_IN_CARBON := FALSE}
- {$setc OLDROUTINENAMES := FALSE}
- {$setc OPAQUE_TOOLBOX_STRUCTS := TRUE}
- {$setc OPAQUE_UPP_TYPES := TRUE}
- {$setc OTCARBONAPPLICATION := TRUE}
- {$setc OTKERNEL := FALSE}
- {$setc PM_USE_SESSION_APIS := TRUE}
- {$setc TARGET_API_MAC_CARBON := TRUE}
- {$setc TARGET_API_MAC_OS8 := FALSE}
- {$setc TARGET_API_MAC_OSX := TRUE}
- {$setc TARGET_CARBON := TRUE}
- {$setc TARGET_CPU_68K := FALSE}
- {$setc TARGET_CPU_MIPS := FALSE}
- {$setc TARGET_CPU_SPARC := FALSE}
- {$setc TARGET_OS_UNIX := FALSE}
- {$setc TARGET_OS_WIN32 := FALSE}
- {$setc TARGET_RT_MAC_68881 := FALSE}
- {$setc TARGET_RT_MAC_CFM := FALSE}
- {$setc TARGET_RT_MAC_MACHO := TRUE}
- {$setc TYPED_FUNCTION_POINTERS := TRUE}
- {$setc TYPE_BOOL := FALSE}
- {$setc TYPE_EXTENDED := FALSE}
- {$setc TYPE_LONGLONG := TRUE}
- uses MacTypes,ConditionalMacros;
- {$endc} {not MACOSALLINCLUDE}
- {$ifc TARGET_OS_MAC}
- {$ALIGN POWER}
- { ==========================================================================================================================}
- {
- =================================================================================================
- Definitions of the Basic Linear Algebra Subprograms (BLAS) as provided Apple Computer.
- A few additional functions, unique to Mac OS, have also been provided.
- These are clearly documented as Apple extensions.
- Documentation on the BLAS standard, including reference implementations, can be found on the web
- starting from the BLAS FAQ page at these URLs (verified live as of April 2002):
- http://www.netlib.org/blas/faq.html
- http://www.netlib.org/blas/blast-forum/blast-forum.html
- =================================================================================================
- }
- {
- =================================================================================================
- Matrix shape and storage
- ========================
- Keeping the various matrix shape and storage parameters straight can be difficult. The BLAS
- documentation generally makes a distinction between the concpetual "matrix" and the physical
- "array". However there are a number of places where this becomes fuzzy because of the overall
- bias towards FORTRAN's column major storage. The confusion is made worse by style differences
- between the level 2 and level 3 functions. It is amplified further by the explicit choice of row
- or column major storage in the C interface.
- The storage order does not affect the actual computation that is performed. That is, it does not
- affect the results other than where they appear in memory. It does affect the values passed
- for so-called "leading dimension" parameters, such as lda in sgemv. These are always the major
- stride in storage, allowing operations on rectangular subsets of larger matrices. For row major
- storage this is the number of columns in the parent matrix, and for column major storage this is
- the number of rows in the parent matrix.
- For the level 2 functions, which deal with only a single matrix, the matrix shape parameters are
- always M and N. These are the logical shape of the matrix, M rows by N columns. The transpose
- parameter, such as transA in sgemv, defines whether the regular matrix or its transpose is used
- in the operation. This affects the implicit length of the input and output vectors. For example,
- if the regular matrix A is used in sgemv, the input vector X has length N, the number of columns
- of A, and the output vector Y has length M, the number of rows of A. The length of the input and
- output vectors is not affected by the storage order of the matrix.
- The level 3 functions deal with 2 input matrices and one output matrix, the matrix shape parameters
- are M, N, and K. The logical shape of the output matrix is always M by N, while K is the common
- dimension of the input matrices. Like level 2, the transpose parameters, such as transA and transB
- in sgemm, define whether the regular input or its transpose is used in the operation. However
- unlike level 2, in level 3 the transpose parameters affect the implicit shape of the input matrix.
- Consider sgemm, which computes "C = (alpha * A * B) + (beta * C)", where A and B might be regular
- or transposed. The logical shape of C is always M rows by N columns. The physical shape depends
- on the storage order parameter. Using column major storage the declaration of C (the array) in C
- (the language) would be something like "float C[N][M]". The logical shape of A without transposition
- is M by K, and B is K by N. The one storage order parameter affects all three matrices.
- For those readers still wondering about the style differences between level 2 and level 3, they
- involve whether the input or output shapes are explicit. For level 2, the input matrix shape is
- always M by N. The input and output vector lengths are implicit and vary according to the
- transpose parameter. For level 3, the output matrix shape is always M by N. The input matrix
- shapes are implicit and vary according to the transpose parameters.
- =================================================================================================
- }
- { ==========================================================================================================================}
- {
- ------------------------------------------------------------------------------------------------------------------
- IsAlignedCount - True if an integer is positive and a multiple of 4. Negative strides are considered unaligned.
- IsAlignedAddr - True if an address is a multiple of 16.
- }
- // #define IsAlignedCount(n) ( (n > 0) && ((n & 3) == 0) )
- // #define IsAlignedAddr(a) ( ((long)a & 15L) == 0 )
- {
- =================================================================================================
- Prototypes for FORTRAN BLAS
- ===========================
- These are prototypes for the FORTRAN callable BLAS functions. They are implemented in C for
- Mac OS, as thin shims that simply call the C BLAS counterpart. These routines should never be
- called from C, but need to be included here so they will get output for the stub library. It
- won't hurt to call them from C, but who would want to since you can't pass literals for sizes?
- FORTRAN compilers are typically MPW tools and use PPCLink, so they will link with the official
- vecLib stub from Apple.
- =================================================================================================
- }
- {
- * SDOT()
- *
- * Availability:
- * Mac OS X: in version 10.0 and later in vecLib.framework
- * CarbonLib: not in Carbon, but vecLib is compatible with CarbonLib
- * Non-Carbon CFM: in vecLib 1.0.2 and later
- }
- function SDOT( (*const*) var N: SInt32; {const} X: Float32Ptr; (*const*) var incX: SInt32; {const} Y: Float32Ptr; (*const*) var incY: SInt32 ): Float32; external name '_SDOT';
- (* AVAILABLE_MAC_OS_X_VERSION_10_0_AND_LATER *)
- {
- * SNRM2()
- *
- * Availability:
- * Mac OS X: in version 10.0 and later in vecLib.framework
- * CarbonLib: not in Carbon, but vecLib is compatible with CarbonLib
- * Non-Carbon CFM: in vecLib 1.0.2 and later
- }
- function SNRM2( (*const*) var N: SInt32; {const} X: Float32Ptr; (*const*) var incX: SInt32 ): Float32; external name '_SNRM2';
- (* AVAILABLE_MAC_OS_X_VERSION_10_0_AND_LATER *)
- {
- * SASUM()
- *
- * Availability:
- * Mac OS X: in version 10.0 and later in vecLib.framework
- * CarbonLib: not in Carbon, but vecLib is compatible with CarbonLib
- * Non-Carbon CFM: in vecLib 1.0.2 and later
- }
- function SASUM( (*const*) var N: SInt32; {const} X: Float32Ptr; (*const*) var incX: SInt32 ): Float32; external name '_SASUM';
- (* AVAILABLE_MAC_OS_X_VERSION_10_0_AND_LATER *)
- {
- * ISAMAX()
- *
- * Availability:
- * Mac OS X: in version 10.0 and later in vecLib.framework
- * CarbonLib: not in Carbon, but vecLib is compatible with CarbonLib
- * Non-Carbon CFM: in vecLib 1.0.2 and later
- }
- function ISAMAX( (*const*) var N: SInt32; {const} X: Float32Ptr; (*const*) var incX: SInt32 ): SInt32; external name '_ISAMAX';
- (* AVAILABLE_MAC_OS_X_VERSION_10_0_AND_LATER *)
- {
- * SSWAP()
- *
- * Availability:
- * Mac OS X: in version 10.0 and later in vecLib.framework
- * CarbonLib: not in Carbon, but vecLib is compatible with CarbonLib
- * Non-Carbon CFM: in vecLib 1.0.2 and later
- }
- procedure SSWAP( (*const*) var N: SInt32; X: Float32Ptr; (*const*) var incX: SInt32; Y: Float32Ptr; (*const*) var incY: SInt32 ); external name '_SSWAP';
- (* AVAILABLE_MAC_OS_X_VERSION_10_0_AND_LATER *)
- {
- * SCOPY()
- *
- * Availability:
- * Mac OS X: in version 10.0 and later in vecLib.framework
- * CarbonLib: not in Carbon, but vecLib is compatible with CarbonLib
- * Non-Carbon CFM: in vecLib 1.0.2 and later
- }
- procedure SCOPY( (*const*) var N: SInt32; {const} X: Float32Ptr; (*const*) var incX: SInt32; Y: Float32Ptr; (*const*) var incY: SInt32 ); external name '_SCOPY';
- (* AVAILABLE_MAC_OS_X_VERSION_10_0_AND_LATER *)
- {
- * SAXPY()
- *
- * Availability:
- * Mac OS X: in version 10.0 and later in vecLib.framework
- * CarbonLib: not in Carbon, but vecLib is compatible with CarbonLib
- * Non-Carbon CFM: in vecLib 1.0.2 and later
- }
- procedure SAXPY( (*const*) var N: SInt32; const (*var*) alpha: Float32; {const} X: Float32Ptr; (*const*) var incX: SInt32; Y: Float32Ptr; (*const*) var incY: SInt32 ); external name '_SAXPY';
- (* AVAILABLE_MAC_OS_X_VERSION_10_0_AND_LATER *)
- {
- * SROT()
- *
- * Availability:
- * Mac OS X: in version 10.0 and later in vecLib.framework
- * CarbonLib: not in Carbon, but vecLib is compatible with CarbonLib
- * Non-Carbon CFM: in vecLib 1.0.2 and later
- }
- procedure SROT( (*const*) var N: SInt32; X: Float32Ptr; (*const*) var incX: SInt32; Y: Float32Ptr; (*const*) var incY: SInt32; const (*var*) c: Float32; const (*var*) s: Float32 ); external name '_SROT';
- (* AVAILABLE_MAC_OS_X_VERSION_10_0_AND_LATER *)
- {
- * SSCAL()
- *
- * Availability:
- * Mac OS X: in version 10.0 and later in vecLib.framework
- * CarbonLib: not in Carbon, but vecLib is compatible with CarbonLib
- * Non-Carbon CFM: in vecLib 1.0.2 and later
- }
- procedure SSCAL( (*const*) var N: SInt32; const (*var*) alpha: Float32; X: Float32Ptr; (*const*) var incX: SInt32 ); external name '_SSCAL';
- (* AVAILABLE_MAC_OS_X_VERSION_10_0_AND_LATER *)
- {
- * SGEMV()
- *
- * Availability:
- * Mac OS X: in version 10.0 and later in vecLib.framework
- * CarbonLib: not in Carbon, but vecLib is compatible with CarbonLib
- * Non-Carbon CFM: in vecLib 1.0.2 and later
- }
- procedure SGEMV( transA: ConstCStringPtr; (*const*) var M: SInt32; (*const*) var N: SInt32; const (*var*) alpha: Float32; {const} A: Float32Ptr; (*const*) var lda: SInt32; {const} X: Float32Ptr; (*const*) var incX: SInt32; const (*var*) beta: Float32; Y: Float32Ptr; (*const*) var incY: SInt32 ); external name '_SGEMV';
- (* AVAILABLE_MAC_OS_X_VERSION_10_0_AND_LATER *)
- {
- * SGEMM()
- *
- * Availability:
- * Mac OS X: in version 10.0 and later in vecLib.framework
- * CarbonLib: not in Carbon, but vecLib is compatible with CarbonLib
- * Non-Carbon CFM: in vecLib 1.0.2 and later
- }
- procedure SGEMM( transA: ConstCStringPtr; transB: ConstCStringPtr; (*const*) var M: SInt32; (*const*) var N: SInt32; (*const*) var K: SInt32; const (*var*) alpha: Float32; {const} A: Float32Ptr; (*const*) var lda: SInt32; {const} B: Float32Ptr; (*const*) var ldb: SInt32; const (*var*) beta: Float32; C: Float32Ptr; (*const*) var ldc: SInt32 ); external name '_SGEMM';
- (* AVAILABLE_MAC_OS_X_VERSION_10_0_AND_LATER *)
- { ==========================================================================================================================}
- { ==========================================================================================================================}
- {$endc} {TARGET_OS_MAC}
- {$ifc not defined MACOSALLINCLUDE or not MACOSALLINCLUDE}
- end.
- {$endc} {not MACOSALLINCLUDE}
|