math.odin 74 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356
  1. package math
  2. import "core:intrinsics"
  3. import "core:builtin"
  4. _ :: intrinsics
  // Float_Class enumerates the categories a floating-point value can be sorted into.
  Float_Class :: enum {
      // An ordinary nonzero floating point value.
      Normal,
      // A subnormal floating point value.
      Subnormal,
      // Zero.
      Zero,
      // The negative zero.
      Neg_Zero,
      // Not-A-Number (NaN).
      NaN,
      // Positive infinity.
      Inf,
      // Negative infinity.
      Neg_Inf,
  }
  // Circle constants and Euler's number.
  TAU :: 6.28318530717958647692528676655900576
  PI  :: 3.14159265358979323846264338327950288
  E   :: 2.71828182845904523536

  // Alternative spellings of the three constants above.
  τ :: TAU
  π :: PI
  e :: E

  // Square roots of 2, 3 and 5.
  SQRT_TWO   :: 1.41421356237309504880168872420969808
  SQRT_THREE :: 1.73205080756887729352744634150587236
  SQRT_FIVE  :: 2.23606797749978969640917366873127623

  // Natural logarithms of 2 and 10.
  LN2  :: 0.693147180559945309417232121458176568
  LN10 :: 2.30258509299404568401799145468436421

  // Maximum number of meaningful digits after the decimal point, per float width.
  MAX_F64_PRECISION :: 16 // for 'f64'
  MAX_F32_PRECISION :: 8  // for 'f32'
  MAX_F16_PRECISION :: 4  // for 'f16'

  // Multiplicative factors for converting between degrees and radians.
  RAD_PER_DEG :: TAU/360.0
  DEG_PER_RAD :: 360.0/TAU
  // Re-export the builtin numeric helpers under this package's namespace.
  abs   :: builtin.abs
  min   :: builtin.min
  max   :: builtin.max
  clamp :: builtin.clamp
  // Endian-specific sqrt overloads. Each one converts its argument to the
  // native-endian type of the same width, forwards to the matching native
  // sqrt_* procedure (defined outside this section) and converts the result back.
  @(require_results)
  sqrt_f16le :: proc "contextless" (x: f16le) -> f16le {
      native := f16(x)
      return #force_inline f16le(sqrt_f16(native))
  }
  @(require_results)
  sqrt_f16be :: proc "contextless" (x: f16be) -> f16be {
      native := f16(x)
      return #force_inline f16be(sqrt_f16(native))
  }
  @(require_results)
  sqrt_f32le :: proc "contextless" (x: f32le) -> f32le {
      native := f32(x)
      return #force_inline f32le(sqrt_f32(native))
  }
  @(require_results)
  sqrt_f32be :: proc "contextless" (x: f32be) -> f32be {
      native := f32(x)
      return #force_inline f32be(sqrt_f32(native))
  }
  @(require_results)
  sqrt_f64le :: proc "contextless" (x: f64le) -> f64le {
      native := f64(x)
      return #force_inline f64le(sqrt_f64(native))
  }
  @(require_results)
  sqrt_f64be :: proc "contextless" (x: f64be) -> f64be {
      native := f64(x)
      return #force_inline f64be(sqrt_f64(native))
  }
  // sqrt is the overload set over all nine float types.
  sqrt :: proc{
      sqrt_f16,
      sqrt_f16le,
      sqrt_f16be,
      sqrt_f32,
      sqrt_f32le,
      sqrt_f32be,
      sqrt_f64,
      sqrt_f64le,
      sqrt_f64be,
  }
  // Endian-specific sin overloads. Each one converts θ to the native-endian
  // type of the same width, forwards to the matching native sin_* procedure
  // (defined outside this section) and converts the result back.
  @(require_results)
  sin_f16le :: proc "contextless" (θ: f16le) -> f16le {
      native := f16(θ)
      return #force_inline f16le(sin_f16(native))
  }
  @(require_results)
  sin_f16be :: proc "contextless" (θ: f16be) -> f16be {
      native := f16(θ)
      return #force_inline f16be(sin_f16(native))
  }
  @(require_results)
  sin_f32le :: proc "contextless" (θ: f32le) -> f32le {
      native := f32(θ)
      return #force_inline f32le(sin_f32(native))
  }
  @(require_results)
  sin_f32be :: proc "contextless" (θ: f32be) -> f32be {
      native := f32(θ)
      return #force_inline f32be(sin_f32(native))
  }
  @(require_results)
  sin_f64le :: proc "contextless" (θ: f64le) -> f64le {
      native := f64(θ)
      return #force_inline f64le(sin_f64(native))
  }
  @(require_results)
  sin_f64be :: proc "contextless" (θ: f64be) -> f64be {
      native := f64(θ)
      return #force_inline f64be(sin_f64(native))
  }
  // sin is the overload set over all nine float types.
  sin :: proc{
      sin_f16,
      sin_f16le,
      sin_f16be,
      sin_f32,
      sin_f32le,
      sin_f32be,
      sin_f64,
      sin_f64le,
      sin_f64be,
  }
  // Endian-specific cos overloads. Each one converts θ to the native-endian
  // type of the same width, forwards to the matching native cos_* procedure
  // (defined outside this section) and converts the result back.
  @(require_results)
  cos_f16le :: proc "contextless" (θ: f16le) -> f16le {
      native := f16(θ)
      return #force_inline f16le(cos_f16(native))
  }
  @(require_results)
  cos_f16be :: proc "contextless" (θ: f16be) -> f16be {
      native := f16(θ)
      return #force_inline f16be(cos_f16(native))
  }
  @(require_results)
  cos_f32le :: proc "contextless" (θ: f32le) -> f32le {
      native := f32(θ)
      return #force_inline f32le(cos_f32(native))
  }
  @(require_results)
  cos_f32be :: proc "contextless" (θ: f32be) -> f32be {
      native := f32(θ)
      return #force_inline f32be(cos_f32(native))
  }
  @(require_results)
  cos_f64le :: proc "contextless" (θ: f64le) -> f64le {
      native := f64(θ)
      return #force_inline f64le(cos_f64(native))
  }
  @(require_results)
  cos_f64be :: proc "contextless" (θ: f64be) -> f64be {
      native := f64(θ)
      return #force_inline f64be(cos_f64(native))
  }
  // cos is the overload set over all nine float types.
  cos :: proc{
      cos_f16,
      cos_f16le,
      cos_f16be,
      cos_f32,
      cos_f32le,
      cos_f32be,
      cos_f64,
      cos_f64le,
      cos_f64be,
  }
  // Endian-specific pow overloads. Each one converts both arguments to the
  // native-endian type of the same width, forwards to the matching native
  // pow_* procedure (defined outside this section) and converts the result back.
  @(require_results)
  pow_f16le :: proc "contextless" (x, power: f16le) -> f16le {
      base, exponent := f16(x), f16(power)
      return #force_inline f16le(pow_f16(base, exponent))
  }
  @(require_results)
  pow_f16be :: proc "contextless" (x, power: f16be) -> f16be {
      base, exponent := f16(x), f16(power)
      return #force_inline f16be(pow_f16(base, exponent))
  }
  @(require_results)
  pow_f32le :: proc "contextless" (x, power: f32le) -> f32le {
      base, exponent := f32(x), f32(power)
      return #force_inline f32le(pow_f32(base, exponent))
  }
  @(require_results)
  pow_f32be :: proc "contextless" (x, power: f32be) -> f32be {
      base, exponent := f32(x), f32(power)
      return #force_inline f32be(pow_f32(base, exponent))
  }
  @(require_results)
  pow_f64le :: proc "contextless" (x, power: f64le) -> f64le {
      base, exponent := f64(x), f64(power)
      return #force_inline f64le(pow_f64(base, exponent))
  }
  @(require_results)
  pow_f64be :: proc "contextless" (x, power: f64be) -> f64be {
      base, exponent := f64(x), f64(power)
      return #force_inline f64be(pow_f64(base, exponent))
  }
  // pow is the overload set over all nine float types.
  pow :: proc{
      pow_f16,
      pow_f16le,
      pow_f16be,
      pow_f32,
      pow_f32le,
      pow_f32be,
      pow_f64,
      pow_f64le,
      pow_f64be,
  }
  // Endian-specific fmuladd overloads. Each one converts all three arguments
  // to the native-endian type of the same width, forwards to the matching
  // native fmuladd_* procedure (defined outside this section) and converts
  // the result back.
  @(require_results)
  fmuladd_f16le :: proc "contextless" (a, b, c: f16le) -> f16le {
      na, nb, nc := f16(a), f16(b), f16(c)
      return #force_inline f16le(fmuladd_f16(na, nb, nc))
  }
  @(require_results)
  fmuladd_f16be :: proc "contextless" (a, b, c: f16be) -> f16be {
      na, nb, nc := f16(a), f16(b), f16(c)
      return #force_inline f16be(fmuladd_f16(na, nb, nc))
  }
  @(require_results)
  fmuladd_f32le :: proc "contextless" (a, b, c: f32le) -> f32le {
      na, nb, nc := f32(a), f32(b), f32(c)
      return #force_inline f32le(fmuladd_f32(na, nb, nc))
  }
  @(require_results)
  fmuladd_f32be :: proc "contextless" (a, b, c: f32be) -> f32be {
      na, nb, nc := f32(a), f32(b), f32(c)
      return #force_inline f32be(fmuladd_f32(na, nb, nc))
  }
  @(require_results)
  fmuladd_f64le :: proc "contextless" (a, b, c: f64le) -> f64le {
      na, nb, nc := f64(a), f64(b), f64(c)
      return #force_inline f64le(fmuladd_f64(na, nb, nc))
  }
  @(require_results)
  fmuladd_f64be :: proc "contextless" (a, b, c: f64be) -> f64be {
      na, nb, nc := f64(a), f64(b), f64(c)
      return #force_inline f64be(fmuladd_f64(na, nb, nc))
  }
  // fmuladd is the overload set over all nine float types.
  fmuladd :: proc{
      fmuladd_f16,
      fmuladd_f16le,
      fmuladd_f16be,
      fmuladd_f32,
      fmuladd_f32le,
      fmuladd_f32be,
      fmuladd_f64,
      fmuladd_f64le,
      fmuladd_f64be,
  }
  // Endian-specific exp overloads. Each one converts its argument to the
  // native-endian type of the same width, forwards to the matching native
  // exp_* procedure (defined outside this section) and converts the result back.
  @(require_results)
  exp_f16le :: proc "contextless" (x: f16le) -> f16le {
      native := f16(x)
      return #force_inline f16le(exp_f16(native))
  }
  @(require_results)
  exp_f16be :: proc "contextless" (x: f16be) -> f16be {
      native := f16(x)
      return #force_inline f16be(exp_f16(native))
  }
  @(require_results)
  exp_f32le :: proc "contextless" (x: f32le) -> f32le {
      native := f32(x)
      return #force_inline f32le(exp_f32(native))
  }
  @(require_results)
  exp_f32be :: proc "contextless" (x: f32be) -> f32be {
      native := f32(x)
      return #force_inline f32be(exp_f32(native))
  }
  @(require_results)
  exp_f64le :: proc "contextless" (x: f64le) -> f64le {
      native := f64(x)
      return #force_inline f64le(exp_f64(native))
  }
  @(require_results)
  exp_f64be :: proc "contextless" (x: f64be) -> f64be {
      native := f64(x)
      return #force_inline f64be(exp_f64(native))
  }
  // exp is the overload set over all nine float types.
  exp :: proc{
      exp_f16,
      exp_f16le,
      exp_f16be,
      exp_f32,
      exp_f32le,
      exp_f32be,
      exp_f64,
      exp_f64le,
      exp_f64be,
  }
  // Endian-specific pow10 overloads. Each one converts its argument to the
  // native-endian type of the same width, forwards to the matching native
  // pow10_* procedure and converts the result back.
  @(require_results)
  pow10_f16le :: proc "contextless" (x: f16le) -> f16le {
      native := f16(x)
      return #force_inline f16le(pow10_f16(native))
  }
  @(require_results)
  pow10_f16be :: proc "contextless" (x: f16be) -> f16be {
      native := f16(x)
      return #force_inline f16be(pow10_f16(native))
  }
  @(require_results)
  pow10_f32le :: proc "contextless" (x: f32le) -> f32le {
      native := f32(x)
      return #force_inline f32le(pow10_f32(native))
  }
  @(require_results)
  pow10_f32be :: proc "contextless" (x: f32be) -> f32be {
      native := f32(x)
      return #force_inline f32be(pow10_f32(native))
  }
  @(require_results)
  pow10_f64le :: proc "contextless" (x: f64le) -> f64le {
      native := f64(x)
      return #force_inline f64le(pow10_f64(native))
  }
  @(require_results)
  pow10_f64be :: proc "contextless" (x: f64be) -> f64be {
      native := f64(x)
      return #force_inline f64be(pow10_f64(native))
  }
  // pow10 is the overload set over all nine float types.
  pow10 :: proc{
      pow10_f16,
      pow10_f16le,
      pow10_f16be,
      pow10_f32,
      pow10_f32le,
      pow10_f32be,
      pow10_f64,
      pow10_f64le,
      pow10_f64be,
  }
  // pow10_f16 returns ten raised to the power n using table lookups.
  //
  // Inside the table ranges the index is `uint(n)` (or `uint(-n)`), so the
  // result is the table entry selected by that conversion.
  //
  // Special cases:
  //     pow10_f16(n)   = +Inf for n > 4
  //     pow10_f16(n)   = 0    for n < -7
  //     pow10_f16(NaN) = NaN
  @(require_results)
  pow10_f16 :: proc "contextless" (n: f16) -> f16 {
      @static pow10_pos_tab := [?]f16{
          1e00, 1e01, 1e02, 1e03, 1e04,
      }
      @static pow10_neg_tab := [?]f16{
          1e-00, 1e-01, 1e-02, 1e-03, 1e-04, 1e-05, 1e-06, 1e-07,
      }

      // NaN is the only value that differs from itself. It fails every range
      // check below and would otherwise reach the final `return 0`, so it is
      // propagated explicitly.
      if n != n {
          return n
      }
      if 0 <= n && n <= 4 {
          return pow10_pos_tab[uint(n)]
      }
      if -7 <= n && n <= 0 {
          return pow10_neg_tab[uint(-n)]
      }
      if n > 0 {
          // Above the largest tabulated power.
          return inf_f16(1)
      }
      // Below the smallest tabulated power.
      return 0
  }
  // pow10_f32 returns ten raised to the power n using table lookups.
  //
  // Inside the table ranges the index is `uint(n)` (or `uint(-n)`), so the
  // result is the table entry selected by that conversion.
  //
  // Special cases:
  //     pow10_f32(n)   = +Inf for n > 38
  //     pow10_f32(n)   = 0    for n < -45
  //     pow10_f32(NaN) = NaN
  @(require_results)
  pow10_f32 :: proc "contextless" (n: f32) -> f32 {
      @static pow10_pos_tab := [?]f32{
          1e00, 1e01, 1e02, 1e03, 1e04, 1e05, 1e06, 1e07, 1e08, 1e09,
          1e10, 1e11, 1e12, 1e13, 1e14, 1e15, 1e16, 1e17, 1e18, 1e19,
          1e20, 1e21, 1e22, 1e23, 1e24, 1e25, 1e26, 1e27, 1e28, 1e29,
          1e30, 1e31, 1e32, 1e33, 1e34, 1e35, 1e36, 1e37, 1e38,
      }
      @static pow10_neg_tab := [?]f32{
          1e-00, 1e-01, 1e-02, 1e-03, 1e-04, 1e-05, 1e-06, 1e-07, 1e-08, 1e-09,
          1e-10, 1e-11, 1e-12, 1e-13, 1e-14, 1e-15, 1e-16, 1e-17, 1e-18, 1e-19,
          1e-20, 1e-21, 1e-22, 1e-23, 1e-24, 1e-25, 1e-26, 1e-27, 1e-28, 1e-29,
          1e-30, 1e-31, 1e-32, 1e-33, 1e-34, 1e-35, 1e-36, 1e-37, 1e-38, 1e-39,
          1e-40, 1e-41, 1e-42, 1e-43, 1e-44, 1e-45,
      }

      // NaN is the only value that differs from itself. It fails every range
      // check below and would otherwise reach the final `return 0`, so it is
      // propagated explicitly.
      if n != n {
          return n
      }
      if 0 <= n && n <= 38 {
          return pow10_pos_tab[uint(n)]
      }
      if -45 <= n && n <= 0 {
          return pow10_neg_tab[uint(-n)]
      }
      if n > 0 {
          // Above the largest tabulated power.
          return inf_f32(1)
      }
      // Below the smallest tabulated power.
      return 0
  }
  // pow10_f64 returns ten raised to the power n using table lookups.
  //
  // The exponent index `uint(n)` (or `uint(-n)`) is split into a multiple of
  // 32, looked up in a coarse table, and a remainder in 0..31, looked up in
  // `pow10_tab`. The two factors are multiplied for non-negative n and
  // divided for negative n.
  //
  // Special cases:
  //     pow10_f64(n)   = +Inf for n > 308
  //     pow10_f64(n)   = 0    for n < -323
  //     pow10_f64(NaN) = NaN
  @(require_results)
  pow10_f64 :: proc "contextless" (n: f64) -> f64 {
      @static pow10_tab := [?]f64{
          1e00, 1e01, 1e02, 1e03, 1e04, 1e05, 1e06, 1e07, 1e08, 1e09,
          1e10, 1e11, 1e12, 1e13, 1e14, 1e15, 1e16, 1e17, 1e18, 1e19,
          1e20, 1e21, 1e22, 1e23, 1e24, 1e25, 1e26, 1e27, 1e28, 1e29,
          1e30, 1e31,
      }
      @static pow10_pos_tab32 := [?]f64{
          1e00, 1e32, 1e64, 1e96, 1e128, 1e160, 1e192, 1e224, 1e256, 1e288,
      }
      @static pow10_neg_tab32 := [?]f64{
          1e-00, 1e-32, 1e-64, 1e-96, 1e-128, 1e-160, 1e-192, 1e-224, 1e-256, 1e-288, 1e-320,
      }

      // NaN is the only value that differs from itself. It fails every range
      // check below and would otherwise reach the final `return 0`, so it is
      // propagated explicitly.
      if n != n {
          return n
      }
      if 0 <= n && n <= 308 {
          return pow10_pos_tab32[uint(n)/32] * pow10_tab[uint(n)%32]
      }
      if -323 <= n && n <= 0 {
          return pow10_neg_tab32[uint(-n)/32] / pow10_tab[uint(-n)%32]
      }
      if n > 0 {
          // Above the largest tabulated power.
          return inf_f64(1)
      }
      // Below the smallest tabulated power.
      return 0
  }
  // pow2_f64 builds the f64 value for two raised to the integer power `exp`
  // directly from its bit pattern, using the F64_BIAS and F64_SHIFT constants
  // defined outside this section.
  @(require_results)
  pow2_f64 :: proc "contextless" (#any_int exp: int) -> (res: f64) {
      // Overflow, +Inf
      if exp > 1023 {
          return 0h7ff00000_00000000
      }
      // Normal: place the biased exponent in the exponent field.
      if exp >= -1022 {
          return transmute(f64)(u64(exp + F64_BIAS) << F64_SHIFT)
      }
      // Underflow
      if exp < -1075 {
          return f64(0)
      }
      // Underflow.
      // Note that pow(2, -1075) returns 0h1 on Windows and 0h0 on macOS & Linux.
      if exp == -1075 {
          return 0h00000000_00000000
      }
      // Denormal: build a value with the exponent raised by F64_SHIFT + 1,
      // then multiply by 1 / 2**(F64_SHIFT + 1) to bring it back down.
      raised := u64(exp + (F64_SHIFT + 1) + F64_BIAS) << F64_SHIFT
      scale := f64(1) / (1 << (F64_SHIFT + 1))
      return scale * transmute(f64)raised
  }
  // pow2_f32 builds the f32 value for two raised to the integer power `exp`
  // directly from its bit pattern, using the F32_BIAS and F32_SHIFT constants
  // defined outside this section.
  @(require_results)
  pow2_f32 :: proc "contextless" (#any_int exp: int) -> (res: f32) {
      // Overflow, +Inf
      if exp > 127 {
          return 0h7f80_0000
      }
      // Normal: place the biased exponent in the exponent field.
      if exp >= -126 {
          return transmute(f32)(u32(exp + F32_BIAS) << F32_SHIFT)
      }
      // Underflow
      if exp < -151 {
          return f32(0)
      }
      // Denormal: build a value with the exponent raised by F32_SHIFT + 1,
      // then multiply by 1 / 2**(F32_SHIFT + 1) to bring it back down.
      raised := u32(exp + (F32_SHIFT + 1) + F32_BIAS) << F32_SHIFT
      scale := f32(1) / (1 << (F32_SHIFT + 1))
      return scale * transmute(f32)raised
  }
  // pow2_f16 builds the f16 value for two raised to the integer power `exp`
  // directly from its bit pattern, using the F16_BIAS and F16_SHIFT constants
  // defined outside this section.
  @(require_results)
  pow2_f16 :: proc "contextless" (#any_int exp: int) -> (res: f16) {
      // Overflow, +Inf
      if exp > 15 {
          return 0h7c00
      }
      // Normal: place the biased exponent in the exponent field.
      if exp >= -14 {
          return transmute(f16)(u16(exp + F16_BIAS) << F16_SHIFT)
      }
      // Underflow
      if exp < -25 {
          return 0h0000
      }
      // Underflow: this exponent is mapped to the bit pattern 0h0001.
      if exp == -25 {
          return 0h0001
      }
      // Denormal: build a value with the exponent raised by F16_SHIFT + 1,
      // then multiply by 1 / 2**(F16_SHIFT + 1) to bring it back down.
      raised := u16(exp + (F16_SHIFT + 1) + F16_BIAS) << F16_SHIFT
      scale := f16(1) / (1 << (F16_SHIFT + 1))
      return scale * transmute(f16)raised
  }
  // ldexp_f64 returns val * 2**exp, computed by rewriting the exponent field
  // of val's bit pattern.
  //
  // Zero, infinities and NaN are returned unchanged. Results whose exponent
  // falls below -1075 become a zero carrying val's sign; results whose
  // exponent exceeds 1023 become an infinity carrying val's sign.
  @(require_results)
  ldexp_f64 :: proc "contextless" (val: f64, exp: int) -> f64 {
      if val == 0 || is_inf(val) || is_nan(val) {
          return val
      }

      // normalize_f64 is defined outside this section; its second result is
      // added to the requested exponent.
      mantissa, adjust := normalize_f64(val)
      bits := transmute(u64)mantissa

      // Requested exponent + normalisation adjustment + the unbiased exponent
      // already stored in the value.
      total := exp + adjust
      total += int(bits>>F64_SHIFT)&F64_MASK - F64_BIAS

      if total < -1075 { // underflow
          return copy_sign(0, mantissa)
      }
      if total > 1023 { // overflow
          if mantissa < 0 {
              return inf_f64(-1)
          }
          return inf_f64(+1)
      }

      scale: f64 = 1
      if total < -1022 { // denormal
          // Store an exponent 53 higher and compensate with the final multiply.
          total += 53
          scale = 1.0 / (1<<53)
      }

      // Replace the exponent field with the new biased exponent.
      bits &~= F64_MASK << F64_SHIFT
      bits |= u64(total+F64_BIAS) << F64_SHIFT
      return scale * transmute(f64)bits
  }
  // The narrower native widths are computed by widening to f64, calling
  // ldexp_f64, and narrowing the result.
  @(require_results)
  ldexp_f16 :: proc "contextless" (val: f16, exp: int) -> f16 {
      wide := f64(val)
      return f16(ldexp_f64(wide, exp))
  }
  @(require_results)
  ldexp_f32 :: proc "contextless" (val: f32, exp: int) -> f32 {
      wide := f64(val)
      return f32(ldexp_f64(wide, exp))
  }
  // Endian-specific overloads go through the native-endian procedure of the same width.
  @(require_results)
  ldexp_f16le :: proc "contextless" (val: f16le, exp: int) -> f16le {
      native := f16(val)
      return #force_inline f16le(ldexp_f16(native, exp))
  }
  @(require_results)
  ldexp_f16be :: proc "contextless" (val: f16be, exp: int) -> f16be {
      native := f16(val)
      return #force_inline f16be(ldexp_f16(native, exp))
  }
  @(require_results)
  ldexp_f32le :: proc "contextless" (val: f32le, exp: int) -> f32le {
      native := f32(val)
      return #force_inline f32le(ldexp_f32(native, exp))
  }
  @(require_results)
  ldexp_f32be :: proc "contextless" (val: f32be, exp: int) -> f32be {
      native := f32(val)
      return #force_inline f32be(ldexp_f32(native, exp))
  }
  @(require_results)
  ldexp_f64le :: proc "contextless" (val: f64le, exp: int) -> f64le {
      native := f64(val)
      return #force_inline f64le(ldexp_f64(native, exp))
  }
  @(require_results)
  ldexp_f64be :: proc "contextless" (val: f64be, exp: int) -> f64be {
      native := f64(val)
      return #force_inline f64be(ldexp_f64(native, exp))
  }
  // ldexp is the inverse of frexp:
  // it returns val * 2**exp.
  //
  // Special cases:
  //     ldexp(+0, exp)   = +0
  //     ldexp(-0, exp)   = -0
  //     ldexp(+inf, exp) = +inf
  //     ldexp(-inf, exp) = -inf
  //     ldexp(NaN, exp)  = NaN
  ldexp :: proc{
      ldexp_f16,
      ldexp_f16le,
      ldexp_f16be,
      ldexp_f32,
      ldexp_f32le,
      ldexp_f32be,
      ldexp_f64,
      ldexp_f64le,
      ldexp_f64be,
  }
  // log_* compute ln(x) / ln(base); `ln` is defined outside this section.
  // The endian-specific variants go through the native-endian procedure of
  // the same width.
  @(require_results)
  log_f16 :: proc "contextless" (x, base: f16) -> f16 {
      numerator := ln(x)
      denominator := ln(base)
      return numerator / denominator
  }
  @(require_results)
  log_f16le :: proc "contextless" (x, base: f16le) -> f16le {
      result := log_f16(f16(x), f16(base))
      return f16le(result)
  }
  @(require_results)
  log_f16be :: proc "contextless" (x, base: f16be) -> f16be {
      result := log_f16(f16(x), f16(base))
      return f16be(result)
  }
  @(require_results)
  log_f32 :: proc "contextless" (x, base: f32) -> f32 {
      numerator := ln(x)
      denominator := ln(base)
      return numerator / denominator
  }
  @(require_results)
  log_f32le :: proc "contextless" (x, base: f32le) -> f32le {
      result := log_f32(f32(x), f32(base))
      return f32le(result)
  }
  @(require_results)
  log_f32be :: proc "contextless" (x, base: f32be) -> f32be {
      result := log_f32(f32(x), f32(base))
      return f32be(result)
  }
  @(require_results)
  log_f64 :: proc "contextless" (x, base: f64) -> f64 {
      numerator := ln(x)
      denominator := ln(base)
      return numerator / denominator
  }
  @(require_results)
  log_f64le :: proc "contextless" (x, base: f64le) -> f64le {
      result := log_f64(f64(x), f64(base))
      return f64le(result)
  }
  @(require_results)
  log_f64be :: proc "contextless" (x, base: f64be) -> f64be {
      result := log_f64(f64(x), f64(base))
      return f64be(result)
  }
  // log is the overload set over all nine float types.
  log :: proc{
      log_f16,
      log_f16le,
      log_f16be,
      log_f32,
      log_f32le,
      log_f32be,
      log_f64,
      log_f64le,
      log_f64be,
  }
  // log2_* evaluate the general-base logarithm with a base of 2.
  // The endian-specific variants go through the native-endian log2 procedure
  // of the same width.
  @(require_results)
  log2_f16 :: proc "contextless" (x: f16) -> f16 {
      return log_f16(x, 2.0)
  }
  @(require_results)
  log2_f16le :: proc "contextless" (x: f16le) -> f16le {
      result := log2_f16(f16(x))
      return f16le(result)
  }
  @(require_results)
  log2_f16be :: proc "contextless" (x: f16be) -> f16be {
      result := log2_f16(f16(x))
      return f16be(result)
  }
  @(require_results)
  log2_f32 :: proc "contextless" (x: f32) -> f32 {
      return log_f32(x, 2.0)
  }
  @(require_results)
  log2_f32le :: proc "contextless" (x: f32le) -> f32le {
      result := log2_f32(f32(x))
      return f32le(result)
  }
  @(require_results)
  log2_f32be :: proc "contextless" (x: f32be) -> f32be {
      result := log2_f32(f32(x))
      return f32be(result)
  }
  @(require_results)
  log2_f64 :: proc "contextless" (x: f64) -> f64 {
      return log_f64(x, 2.0)
  }
  @(require_results)
  log2_f64le :: proc "contextless" (x: f64le) -> f64le {
      result := log2_f64(f64(x))
      return f64le(result)
  }
  @(require_results)
  log2_f64be :: proc "contextless" (x: f64be) -> f64be {
      result := log2_f64(f64(x))
      return f64be(result)
  }
  // log2 is the overload set over all nine float types.
  log2 :: proc{
      log2_f16,
      log2_f16le,
      log2_f16be,
      log2_f32,
      log2_f32le,
      log2_f32be,
      log2_f64,
      log2_f64le,
      log2_f64be,
  }
  // log10_* compute ln(x) / LN10; `ln` is defined outside this section.
  // The endian-specific variants go through the native-endian procedure of
  // the same width.
  @(require_results)
  log10_f16 :: proc "contextless" (x: f16) -> f16 {
      natural := ln(x)
      return natural / LN10
  }
  @(require_results)
  log10_f16le :: proc "contextless" (x: f16le) -> f16le {
      result := log10_f16(f16(x))
      return f16le(result)
  }
  @(require_results)
  log10_f16be :: proc "contextless" (x: f16be) -> f16be {
      result := log10_f16(f16(x))
      return f16be(result)
  }
  @(require_results)
  log10_f32 :: proc "contextless" (x: f32) -> f32 {
      natural := ln(x)
      return natural / LN10
  }
  @(require_results)
  log10_f32le :: proc "contextless" (x: f32le) -> f32le {
      result := log10_f32(f32(x))
      return f32le(result)
  }
  @(require_results)
  log10_f32be :: proc "contextless" (x: f32be) -> f32be {
      result := log10_f32(f32(x))
      return f32be(result)
  }
  @(require_results)
  log10_f64 :: proc "contextless" (x: f64) -> f64 {
      natural := ln(x)
      return natural / LN10
  }
  @(require_results)
  log10_f64le :: proc "contextless" (x: f64le) -> f64le {
      result := log10_f64(f64(x))
      return f64le(result)
  }
  @(require_results)
  log10_f64be :: proc "contextless" (x: f64be) -> f64be {
      result := log10_f64(f64(x))
      return f64be(result)
  }
  // log10 is the overload set over all nine float types.
  log10 :: proc{
      log10_f16,
      log10_f16le,
      log10_f16be,
      log10_f32,
      log10_f32le,
      log10_f32be,
      log10_f64,
      log10_f64le,
      log10_f64be,
  }
  // tan_* compute sin(θ) / cos(θ). The endian-specific variants go through
  // the native-endian procedure of the same width.
  @(require_results)
  tan_f16 :: proc "contextless" (θ: f16) -> f16 {
      s := sin(θ)
      c := cos(θ)
      return s / c
  }
  @(require_results)
  tan_f16le :: proc "contextless" (θ: f16le) -> f16le {
      result := tan_f16(f16(θ))
      return f16le(result)
  }
  @(require_results)
  tan_f16be :: proc "contextless" (θ: f16be) -> f16be {
      result := tan_f16(f16(θ))
      return f16be(result)
  }
  @(require_results)
  tan_f32 :: proc "contextless" (θ: f32) -> f32 {
      s := sin(θ)
      c := cos(θ)
      return s / c
  }
  @(require_results)
  tan_f32le :: proc "contextless" (θ: f32le) -> f32le {
      result := tan_f32(f32(θ))
      return f32le(result)
  }
  @(require_results)
  tan_f32be :: proc "contextless" (θ: f32be) -> f32be {
      result := tan_f32(f32(θ))
      return f32be(result)
  }
  @(require_results)
  tan_f64 :: proc "contextless" (θ: f64) -> f64 {
      s := sin(θ)
      c := cos(θ)
      return s / c
  }
  @(require_results)
  tan_f64le :: proc "contextless" (θ: f64le) -> f64le {
      result := tan_f64(f64(θ))
      return f64le(result)
  }
  @(require_results)
  tan_f64be :: proc "contextless" (θ: f64be) -> f64be {
      result := tan_f64(f64(θ))
      return f64be(result)
  }
  // tan is the overload set over all nine float types.
  tan :: proc{
      tan_f16,
      tan_f16le,
      tan_f16be,
      tan_f32,
      tan_f32le,
      tan_f32be,
      tan_f64,
      tan_f64le,
      tan_f64be,
  }
  // lerp blends a and b with weight t: the result is a*(1-t) + b*t,
  // which is a at t = 0 and b at t = 1.
  @(require_results)
  lerp :: proc "contextless" (a, b: $T, t: $E) -> (x: T) {
      x = a*(1-t) + b*t
      return
  }
  // saturate clamps a to the closed interval [0, 1].
  @(require_results)
  saturate :: proc "contextless" (a: $T) -> (x: T) {
      x = clamp(a, 0, 1)
      return
  }
  // unlerp returns how far x lies between a and b as a fraction of the
  // distance from a to b: (x-a)/(b-a). Only non-array float types are accepted.
  @(require_results)
  unlerp :: proc "contextless" (a, b, x: $T) -> (t: T) where intrinsics.type_is_float(T), !intrinsics.type_is_array(T) {
      offset := x - a
      span := b - a
      t = offset / span
      return
  }
  // remap linearly maps old_value from the range [old_min, old_max] onto the
  // range [new_min, new_max].
  //
  // When the source range is empty (old_min == old_max) the ratio is
  // undefined, so the midpoint of the target range is returned instead.
  @(require_results)
  remap :: proc "contextless" (old_value, old_min, old_max, new_min, new_max: $T) -> (x: T) where intrinsics.type_is_numeric(T), !intrinsics.type_is_array(T) {
      old_range := old_max - old_min
      new_range := new_max - new_min
      if old_range == 0 {
          // The midpoint has to be offset by new_min; new_range/2 on its own
          // only lies inside the target range when new_min is 0.
          return new_min + new_range / 2
      }
      return ((old_value - old_min) / old_range) * new_range + new_min
  }
  // wrap reduces x with mod(x, y) and, when that remainder is negative,
  // shifts it up by y. `mod` is defined outside this section.
  @(require_results)
  wrap :: proc "contextless" (x, y: $T) -> T where intrinsics.type_is_numeric(T), !intrinsics.type_is_array(T) {
      remainder := mod(x, y)
      if remainder < 0 {
          return y + remainder
      }
      return remainder
  }
  // angle_diff returns the difference from angle a to angle b, computed as
  // wrap(2*d, TAU) - d where d = wrap(b - a, TAU).
  @(require_results)
  angle_diff :: proc "contextless" (a, b: $T) -> T where intrinsics.type_is_numeric(T), !intrinsics.type_is_array(T) {
      forward := wrap(b - a, TAU)
      doubled := wrap(forward*2, TAU)
      return doubled - forward
  }
  // angle_lerp moves from angle a towards angle b by the fraction t of
  // angle_diff(a, b).
  @(require_results)
  angle_lerp :: proc "contextless" (a, b, t: $T) -> T where intrinsics.type_is_numeric(T), !intrinsics.type_is_array(T) {
      delta := angle_diff(a, b)
      return a + delta * t
  }
  // step returns 0 when x is below edge and 1 otherwise.
  @(require_results)
  step :: proc "contextless" (edge, x: $T) -> T where intrinsics.type_is_numeric(T), !intrinsics.type_is_array(T) {
      if x < edge {
          return 0
      }
      return 1
  }
  // smoothstep rescales x relative to [edge0, edge1], clamps the ratio to
  // [0, 1] and evaluates the cubic t*t*(3 - 2*t) on it.
  @(require_results)
  smoothstep :: proc "contextless" (edge0, edge1, x: $T) -> T where intrinsics.type_is_numeric(T), !intrinsics.type_is_array(T) {
      span := edge1 - edge0
      ratio := (x - edge0) / span
      t := clamp(ratio, 0, 1)
      return t * t * (3 - 2*t)
  }
  // bias evaluates t / ((1/b - 2)*(1 - t) + 1).
  @(require_results)
  bias :: proc "contextless" (t, b: $T) -> T where intrinsics.type_is_numeric(T) {
      inverse := 1/b
      denominator := (inverse - 2) * (1 - t) + 1
      return t / denominator
  }
  // gain applies `bias` to each half of the unit interval separately:
  // below t = 0.5 it uses bias(2t, g) scaled into the lower half, otherwise
  // bias(2t - 1, 1 - g) scaled into the upper half.
  @(require_results)
  gain :: proc "contextless" (t, g: $T) -> T where intrinsics.type_is_numeric(T) {
      if t < 0.5 {
          lower := bias(t*2, g)
          return lower*0.5
      }
      upper := bias(t*2 - 1, 1 - g)
      return upper*0.5 + 0.5
  }
  // sign_* return 1 for values above zero, -1 for values below zero and 0
  // for everything else (values that compare neither above nor below zero).
  @(require_results)
  sign_f16 :: proc "contextless" (x: f16) -> f16 {
      switch {
      case 0 < x: return 1
      case x < 0: return -1
      }
      return 0
  }
  @(require_results)
  sign_f16le :: proc "contextless" (x: f16le) -> f16le {
      switch {
      case 0 < x: return 1
      case x < 0: return -1
      }
      return 0
  }
  @(require_results)
  sign_f16be :: proc "contextless" (x: f16be) -> f16be {
      switch {
      case 0 < x: return 1
      case x < 0: return -1
      }
      return 0
  }
  @(require_results)
  sign_f32 :: proc "contextless" (x: f32) -> f32 {
      switch {
      case 0 < x: return 1
      case x < 0: return -1
      }
      return 0
  }
  @(require_results)
  sign_f32le :: proc "contextless" (x: f32le) -> f32le {
      switch {
      case 0 < x: return 1
      case x < 0: return -1
      }
      return 0
  }
  @(require_results)
  sign_f32be :: proc "contextless" (x: f32be) -> f32be {
      switch {
      case 0 < x: return 1
      case x < 0: return -1
      }
      return 0
  }
  @(require_results)
  sign_f64 :: proc "contextless" (x: f64) -> f64 {
      switch {
      case 0 < x: return 1
      case x < 0: return -1
      }
      return 0
  }
  @(require_results)
  sign_f64le :: proc "contextless" (x: f64le) -> f64le {
      switch {
      case 0 < x: return 1
      case x < 0: return -1
      }
      return 0
  }
  @(require_results)
  sign_f64be :: proc "contextless" (x: f64be) -> f64be {
      switch {
      case 0 < x: return 1
      case x < 0: return -1
      }
      return 0
  }
  // sign is the overload set over all nine float types.
  sign :: proc{
      sign_f16,
      sign_f16le,
      sign_f16be,
      sign_f32,
      sign_f32le,
      sign_f32be,
      sign_f64,
      sign_f64le,
      sign_f64be,
  }
  // sign_bit_* report whether the most significant bit of the value's bit
  // pattern is set. The endian-specific variants go through the
  // native-endian procedure of the same width.
  @(require_results)
  sign_bit_f16 :: proc "contextless" (x: f16) -> bool {
      bits := transmute(u16)x
      return bits & (1<<15) != 0
  }
  @(require_results)
  sign_bit_f16le :: proc "contextless" (x: f16le) -> bool {
      native := f16(x)
      return #force_inline sign_bit_f16(native)
  }
  @(require_results)
  sign_bit_f16be :: proc "contextless" (x: f16be) -> bool {
      native := f16(x)
      return #force_inline sign_bit_f16(native)
  }
  @(require_results)
  sign_bit_f32 :: proc "contextless" (x: f32) -> bool {
      bits := transmute(u32)x
      return bits & (1<<31) != 0
  }
  @(require_results)
  sign_bit_f32le :: proc "contextless" (x: f32le) -> bool {
      native := f32(x)
      return #force_inline sign_bit_f32(native)
  }
  @(require_results)
  sign_bit_f32be :: proc "contextless" (x: f32be) -> bool {
      native := f32(x)
      return #force_inline sign_bit_f32(native)
  }
  @(require_results)
  sign_bit_f64 :: proc "contextless" (x: f64) -> bool {
      bits := transmute(u64)x
      return bits & (1<<63) != 0
  }
  @(require_results)
  sign_bit_f64le :: proc "contextless" (x: f64le) -> bool {
      native := f64(x)
      return #force_inline sign_bit_f64(native)
  }
  @(require_results)
  sign_bit_f64be :: proc "contextless" (x: f64be) -> bool {
      native := f64(x)
      return #force_inline sign_bit_f64(native)
  }
  // sign_bit is the overload set over all nine float types.
  sign_bit :: proc{
      sign_bit_f16,
      sign_bit_f16le,
      sign_bit_f16be,
      sign_bit_f32,
      sign_bit_f32le,
      sign_bit_f32be,
      sign_bit_f64,
      sign_bit_f64le,
      sign_bit_f64be,
  }
  419. @(require_results)
  420. copy_sign_f16 :: proc "contextless" (x, y: f16) -> f16 {
  421. ix := transmute(u16)x
  422. iy := transmute(u16)y
  423. ix &= 0x7fff
  424. ix |= iy & 0x8000
  425. return transmute(f16)ix
  426. }
  427. @(require_results) copy_sign_f16le :: proc "contextless" (x, y: f16le) -> f16le { return #force_inline f16le(copy_sign_f16(f16(x), f16(y))) }
  428. @(require_results) copy_sign_f16be :: proc "contextless" (x, y: f16be) -> f16be { return #force_inline f16be(copy_sign_f16(f16(x), f16(y))) }
  429. @(require_results)
  430. copy_sign_f32 :: proc "contextless" (x, y: f32) -> f32 {
  431. ix := transmute(u32)x
  432. iy := transmute(u32)y
  433. ix &= 0x7fff_ffff
  434. ix |= iy & 0x8000_0000
  435. return transmute(f32)ix
  436. }
  437. @(require_results) copy_sign_f32le :: proc "contextless" (x, y: f32le) -> f32le { return #force_inline f32le(copy_sign_f32(f32(x), f32(y))) }
  438. @(require_results) copy_sign_f32be :: proc "contextless" (x, y: f32be) -> f32be { return #force_inline f32be(copy_sign_f32(f32(x), f32(y))) }
  439. @(require_results)
  440. copy_sign_f64 :: proc "contextless" (x, y: f64) -> f64 {
  441. ix := transmute(u64)x
  442. iy := transmute(u64)y
  443. ix &= 0x7fff_ffff_ffff_ffff
  444. ix |= iy & 0x8000_0000_0000_0000
  445. return transmute(f64)ix
  446. }
  447. @(require_results) copy_sign_f64le :: proc "contextless" (x, y: f64le) -> f64le { return #force_inline f64le(copy_sign_f64(f64(x), f64(y))) }
  448. @(require_results) copy_sign_f64be :: proc "contextless" (x, y: f64be) -> f64be { return #force_inline f64be(copy_sign_f64(f64(x), f64(y))) }
  449. copy_sign :: proc{
  450. copy_sign_f16, copy_sign_f16le, copy_sign_f16be,
  451. copy_sign_f32, copy_sign_f32le, copy_sign_f32be,
  452. copy_sign_f64, copy_sign_f64le, copy_sign_f64be,
  453. }
  454. @(require_results) to_radians_f16 :: proc "contextless" (degrees: f16) -> f16 { return degrees * RAD_PER_DEG }
  455. @(require_results) to_radians_f16le :: proc "contextless" (degrees: f16le) -> f16le { return degrees * RAD_PER_DEG }
  456. @(require_results) to_radians_f16be :: proc "contextless" (degrees: f16be) -> f16be { return degrees * RAD_PER_DEG }
  457. @(require_results) to_radians_f32 :: proc "contextless" (degrees: f32) -> f32 { return degrees * RAD_PER_DEG }
  458. @(require_results) to_radians_f32le :: proc "contextless" (degrees: f32le) -> f32le { return degrees * RAD_PER_DEG }
  459. @(require_results) to_radians_f32be :: proc "contextless" (degrees: f32be) -> f32be { return degrees * RAD_PER_DEG }
  460. @(require_results) to_radians_f64 :: proc "contextless" (degrees: f64) -> f64 { return degrees * RAD_PER_DEG }
  461. @(require_results) to_radians_f64le :: proc "contextless" (degrees: f64le) -> f64le { return degrees * RAD_PER_DEG }
  462. @(require_results) to_radians_f64be :: proc "contextless" (degrees: f64be) -> f64be { return degrees * RAD_PER_DEG }
  463. @(require_results) to_degrees_f16 :: proc "contextless" (radians: f16) -> f16 { return radians * DEG_PER_RAD }
  464. @(require_results) to_degrees_f16le :: proc "contextless" (radians: f16le) -> f16le { return radians * DEG_PER_RAD }
  465. @(require_results) to_degrees_f16be :: proc "contextless" (radians: f16be) -> f16be { return radians * DEG_PER_RAD }
  466. @(require_results) to_degrees_f32 :: proc "contextless" (radians: f32) -> f32 { return radians * DEG_PER_RAD }
  467. @(require_results) to_degrees_f32le :: proc "contextless" (radians: f32le) -> f32le { return radians * DEG_PER_RAD }
  468. @(require_results) to_degrees_f32be :: proc "contextless" (radians: f32be) -> f32be { return radians * DEG_PER_RAD }
  469. @(require_results) to_degrees_f64 :: proc "contextless" (radians: f64) -> f64 { return radians * DEG_PER_RAD }
  470. @(require_results) to_degrees_f64le :: proc "contextless" (radians: f64le) -> f64le { return radians * DEG_PER_RAD }
  471. @(require_results) to_degrees_f64be :: proc "contextless" (radians: f64be) -> f64be { return radians * DEG_PER_RAD }
  472. to_radians :: proc{
  473. to_radians_f16, to_radians_f16le, to_radians_f16be,
  474. to_radians_f32, to_radians_f32le, to_radians_f32be,
  475. to_radians_f64, to_radians_f64le, to_radians_f64be,
  476. }
  477. to_degrees :: proc{
  478. to_degrees_f16, to_degrees_f16le, to_degrees_f16be,
  479. to_degrees_f32, to_degrees_f32le, to_degrees_f32be,
  480. to_degrees_f64, to_degrees_f64le, to_degrees_f64be,
  481. }
  482. @(require_results)
  483. trunc_f16 :: proc "contextless" (x: f16) -> f16 {
  484. trunc_internal :: proc "contextless" (f: f16) -> f16 {
  485. mask :: F16_MASK
  486. shift :: F16_SHIFT
  487. bias :: F16_BIAS
  488. if f < 1 {
  489. switch {
  490. case f < 0: return -trunc_internal(-f)
  491. case f == 0: return f
  492. case: return 0
  493. }
  494. }
  495. x := transmute(u16)f
  496. e := (x >> shift) & mask - bias
  497. if e < shift {
  498. x &~= 1 << (shift-e) - 1
  499. }
  500. return transmute(f16)x
  501. }
  502. switch classify(x) {
  503. case .Zero, .Neg_Zero, .NaN, .Inf, .Neg_Inf:
  504. return x
  505. case .Normal, .Subnormal: // carry on
  506. }
  507. return trunc_internal(x)
  508. }
  509. @(require_results) trunc_f16le :: proc "contextless" (x: f16le) -> f16le { return #force_inline f16le(trunc_f16(f16(x))) }
  510. @(require_results) trunc_f16be :: proc "contextless" (x: f16be) -> f16be { return #force_inline f16be(trunc_f16(f16(x))) }
  511. @(require_results)
  512. trunc_f32 :: proc "contextless" (x: f32) -> f32 {
  513. trunc_internal :: proc "contextless" (f: f32) -> f32 {
  514. mask :: F32_MASK
  515. shift :: F32_SHIFT
  516. bias :: F32_BIAS
  517. if f < 1 {
  518. switch {
  519. case f < 0: return -trunc_internal(-f)
  520. case f == 0: return f
  521. case: return 0
  522. }
  523. }
  524. x := transmute(u32)f
  525. e := (x >> shift) & mask - bias
  526. if e < shift {
  527. x &~= 1 << (shift-e) - 1
  528. }
  529. return transmute(f32)x
  530. }
  531. switch classify(x) {
  532. case .Zero, .Neg_Zero, .NaN, .Inf, .Neg_Inf:
  533. return x
  534. case .Normal, .Subnormal: // carry on
  535. }
  536. return trunc_internal(x)
  537. }
  538. @(require_results) trunc_f32le :: proc "contextless" (x: f32le) -> f32le { return #force_inline f32le(trunc_f32(f32(x))) }
  539. @(require_results) trunc_f32be :: proc "contextless" (x: f32be) -> f32be { return #force_inline f32be(trunc_f32(f32(x))) }
  540. @(require_results)
  541. trunc_f64 :: proc "contextless" (x: f64) -> f64 {
  542. trunc_internal :: proc "contextless" (f: f64) -> f64 {
  543. mask :: F64_MASK
  544. shift :: F64_SHIFT
  545. bias :: F64_BIAS
  546. if f < 1 {
  547. switch {
  548. case f < 0: return -trunc_internal(-f)
  549. case f == 0: return f
  550. case: return 0
  551. }
  552. }
  553. x := transmute(u64)f
  554. e := (x >> shift) & mask - bias
  555. if e < shift {
  556. x &~= 1 << (shift-e) - 1
  557. }
  558. return transmute(f64)x
  559. }
  560. switch classify(x) {
  561. case .Zero, .Neg_Zero, .NaN, .Inf, .Neg_Inf:
  562. return x
  563. case .Normal, .Subnormal: // carry on
  564. }
  565. return trunc_internal(x)
  566. }
  567. @(require_results) trunc_f64le :: proc "contextless" (x: f64le) -> f64le { return #force_inline f64le(trunc_f64(f64(x))) }
  568. @(require_results) trunc_f64be :: proc "contextless" (x: f64be) -> f64be { return #force_inline f64be(trunc_f64(f64(x))) }
  569. // Removes the fractional part of the value, i.e. rounds towards zero.
  570. trunc :: proc{
  571. trunc_f16, trunc_f16le, trunc_f16be,
  572. trunc_f32, trunc_f32le, trunc_f32be,
  573. trunc_f64, trunc_f64le, trunc_f64be,
  574. }
  575. @(require_results)
  576. round_f16 :: proc "contextless" (x: f16) -> f16 {
  577. return ceil(x - 0.5) if x < 0 else floor(x + 0.5)
  578. }
  579. @(require_results)
  580. round_f16le :: proc "contextless" (x: f16le) -> f16le {
  581. return ceil(x - 0.5) if x < 0 else floor(x + 0.5)
  582. }
  583. @(require_results)
  584. round_f16be :: proc "contextless" (x: f16be) -> f16be {
  585. return ceil(x - 0.5) if x < 0 else floor(x + 0.5)
  586. }
  587. @(require_results)
  588. round_f32 :: proc "contextless" (x: f32) -> f32 {
  589. return ceil(x - 0.5) if x < 0 else floor(x + 0.5)
  590. }
  591. @(require_results)
  592. round_f32le :: proc "contextless" (x: f32le) -> f32le {
  593. return ceil(x - 0.5) if x < 0 else floor(x + 0.5)
  594. }
  595. @(require_results)
  596. round_f32be :: proc "contextless" (x: f32be) -> f32be {
  597. return ceil(x - 0.5) if x < 0 else floor(x + 0.5)
  598. }
  599. @(require_results)
  600. round_f64 :: proc "contextless" (x: f64) -> f64 {
  601. return ceil(x - 0.5) if x < 0 else floor(x + 0.5)
  602. }
  603. @(require_results)
  604. round_f64le :: proc "contextless" (x: f64le) -> f64le {
  605. return ceil(x - 0.5) if x < 0 else floor(x + 0.5)
  606. }
  607. @(require_results)
  608. round_f64be :: proc "contextless" (x: f64be) -> f64be {
  609. return ceil(x - 0.5) if x < 0 else floor(x + 0.5)
  610. }
  611. round :: proc{
  612. round_f16, round_f16le, round_f16be,
  613. round_f32, round_f32le, round_f32be,
  614. round_f64, round_f64le, round_f64be,
  615. }
  616. @(require_results) ceil_f16 :: proc "contextless" (x: f16) -> f16 { return -floor(-x) }
  617. @(require_results) ceil_f16le :: proc "contextless" (x: f16le) -> f16le { return -floor(-x) }
  618. @(require_results) ceil_f16be :: proc "contextless" (x: f16be) -> f16be { return -floor(-x) }
  619. @(require_results) ceil_f32 :: proc "contextless" (x: f32) -> f32 { return -floor(-x) }
  620. @(require_results) ceil_f32le :: proc "contextless" (x: f32le) -> f32le { return -floor(-x) }
  621. @(require_results) ceil_f32be :: proc "contextless" (x: f32be) -> f32be { return -floor(-x) }
  622. @(require_results) ceil_f64 :: proc "contextless" (x: f64) -> f64 { return -floor(-x) }
  623. @(require_results) ceil_f64le :: proc "contextless" (x: f64le) -> f64le { return -floor(-x) }
  624. @(require_results) ceil_f64be :: proc "contextless" (x: f64be) -> f64be { return -floor(-x) }
  625. ceil :: proc{
  626. ceil_f16, ceil_f16le, ceil_f16be,
  627. ceil_f32, ceil_f32le, ceil_f32be,
  628. ceil_f64, ceil_f64le, ceil_f64be,
  629. }
  630. @(require_results)
  631. floor_f16 :: proc "contextless" (x: f16) -> f16 {
  632. if x == 0 || is_nan(x) || is_inf(x) {
  633. return x
  634. }
  635. if x < 0 {
  636. d, fract := modf(-x)
  637. if fract != 0.0 {
  638. d = d + 1
  639. }
  640. return -d
  641. }
  642. d, _ := modf(x)
  643. return d
  644. }
  645. @(require_results) floor_f16le :: proc "contextless" (x: f16le) -> f16le { return #force_inline f16le(floor_f16(f16(x))) }
  646. @(require_results) floor_f16be :: proc "contextless" (x: f16be) -> f16be { return #force_inline f16be(floor_f16(f16(x))) }
  647. @(require_results)
  648. floor_f32 :: proc "contextless" (x: f32) -> f32 {
  649. if x == 0 || is_nan(x) || is_inf(x) {
  650. return x
  651. }
  652. if x < 0 {
  653. d, fract := modf(-x)
  654. if fract != 0.0 {
  655. d = d + 1
  656. }
  657. return -d
  658. }
  659. d, _ := modf(x)
  660. return d
  661. }
  662. @(require_results) floor_f32le :: proc "contextless" (x: f32le) -> f32le { return #force_inline f32le(floor_f32(f32(x))) }
  663. @(require_results) floor_f32be :: proc "contextless" (x: f32be) -> f32be { return #force_inline f32be(floor_f32(f32(x))) }
  664. @(require_results)
  665. floor_f64 :: proc "contextless" (x: f64) -> f64 {
  666. if x == 0 || is_nan(x) || is_inf(x) {
  667. return x
  668. }
  669. if x < 0 {
  670. d, fract := modf(-x)
  671. if fract != 0.0 {
  672. d = d + 1
  673. }
  674. return -d
  675. }
  676. d, _ := modf(x)
  677. return d
  678. }
  679. @(require_results) floor_f64le :: proc "contextless" (x: f64le) -> f64le { return #force_inline f64le(floor_f64(f64(x))) }
  680. @(require_results) floor_f64be :: proc "contextless" (x: f64be) -> f64be { return #force_inline f64be(floor_f64(f64(x))) }
  681. floor :: proc{
  682. floor_f16, floor_f16le, floor_f16be,
  683. floor_f32, floor_f32le, floor_f32be,
  684. floor_f64, floor_f64le, floor_f64be,
  685. }
  686. @(require_results)
  687. floor_div :: proc "contextless" (x, y: $T) -> T
  688. where intrinsics.type_is_integer(T) {
  689. a := x / y
  690. r := x % y
  691. if (r > 0 && y < 0) || (r < 0 && y > 0) {
  692. a -= 1
  693. }
  694. return a
  695. }
  696. @(require_results)
  697. floor_mod :: proc "contextless" (x, y: $T) -> T
  698. where intrinsics.type_is_integer(T) {
  699. r := x % y
  700. if (r > 0 && y < 0) || (r < 0 && y > 0) {
  701. r += y
  702. }
  703. return r
  704. }
  705. @(require_results)
  706. divmod :: #force_inline proc "contextless" (x, y: $T) -> (div, mod: T)
  707. where intrinsics.type_is_integer(T) {
  708. div = x / y
  709. mod = x % y
  710. return
  711. }
  712. @(require_results)
  713. floor_divmod :: #force_inline proc "contextless" (x, y: $T) -> (div, mod: T)
  714. where intrinsics.type_is_integer(T) {
  715. div = x / y
  716. mod = x % y
  717. if (div > 0 && y < 0) || (mod < 0 && y > 0) {
  718. div -= 1
  719. mod += y
  720. }
  721. return
  722. }
  723. @(require_results)
  724. modf_f16 :: proc "contextless" (x: f16) -> (int: f16, frac: f16) {
  725. shift :: F16_SHIFT
  726. mask :: F16_MASK
  727. bias :: F16_BIAS
  728. if x < 1 {
  729. switch {
  730. case x < 0:
  731. int, frac = modf(-x)
  732. return -int, -frac
  733. case x == 0:
  734. return x, x
  735. }
  736. return 0, x
  737. }
  738. i := transmute(u16)x
  739. e := uint(i>>shift)&mask - bias
  740. if e < shift {
  741. i &~= 1<<(shift-e) - 1
  742. }
  743. int = transmute(f16)i
  744. frac = x - int
  745. return
  746. }
  747. @(require_results)
  748. modf_f16le :: proc "contextless" (x: f16le) -> (int: f16le, frac: f16le) {
  749. i, f := #force_inline modf_f16(f16(x))
  750. return f16le(i), f16le(f)
  751. }
  752. @(require_results)
  753. modf_f16be :: proc "contextless" (x: f16be) -> (int: f16be, frac: f16be) {
  754. i, f := #force_inline modf_f16(f16(x))
  755. return f16be(i), f16be(f)
  756. }
  757. @(require_results)
  758. modf_f32 :: proc "contextless" (x: f32) -> (int: f32, frac: f32) {
  759. shift :: F32_SHIFT
  760. mask :: F32_MASK
  761. bias :: F32_BIAS
  762. if x < 1 {
  763. switch {
  764. case x < 0:
  765. int, frac = modf(-x)
  766. return -int, -frac
  767. case x == 0:
  768. return x, x
  769. }
  770. return 0, x
  771. }
  772. i := transmute(u32)x
  773. e := uint(i>>shift)&mask - bias
  774. if e < shift {
  775. i &~= 1<<(shift-e) - 1
  776. }
  777. int = transmute(f32)i
  778. frac = x - int
  779. return
  780. }
  781. @(require_results)
  782. modf_f32le :: proc "contextless" (x: f32le) -> (int: f32le, frac: f32le) {
  783. i, f := #force_inline modf_f32(f32(x))
  784. return f32le(i), f32le(f)
  785. }
  786. @(require_results)
  787. modf_f32be :: proc "contextless" (x: f32be) -> (int: f32be, frac: f32be) {
  788. i, f := #force_inline modf_f32(f32(x))
  789. return f32be(i), f32be(f)
  790. }
  791. @(require_results)
  792. modf_f64 :: proc "contextless" (x: f64) -> (int: f64, frac: f64) {
  793. shift :: F64_SHIFT
  794. mask :: F64_MASK
  795. bias :: F64_BIAS
  796. if x < 1 {
  797. switch {
  798. case x < 0:
  799. int, frac = modf(-x)
  800. return -int, -frac
  801. case x == 0:
  802. return x, x
  803. }
  804. return 0, x
  805. }
  806. i := transmute(u64)x
  807. e := uint(i>>shift)&mask - bias
  808. if e < shift {
  809. i &~= 1<<(shift-e) - 1
  810. }
  811. int = transmute(f64)i
  812. frac = x - int
  813. return
  814. }
  815. @(require_results)
  816. modf_f64le :: proc "contextless" (x: f64le) -> (int: f64le, frac: f64le) {
  817. i, f := #force_inline modf_f64(f64(x))
  818. return f64le(i), f64le(f)
  819. }
  820. @(require_results)
  821. modf_f64be :: proc "contextless" (x: f64be) -> (int: f64be, frac: f64be) {
  822. i, f := #force_inline modf_f64(f64(x))
  823. return f64be(i), f64be(f)
  824. }
  825. modf :: proc{
  826. modf_f16, modf_f16le, modf_f16be,
  827. modf_f32, modf_f32le, modf_f32be,
  828. modf_f64, modf_f64le, modf_f64be,
  829. }
  830. split_decimal :: modf
  831. @(require_results)
  832. mod_f16 :: proc "contextless" (x, y: f16) -> (n: f16) {
  833. z := abs(y)
  834. n = remainder(abs(x), z)
  835. if sign(n) < 0 {
  836. n += z
  837. }
  838. return copy_sign(n, x)
  839. }
  840. @(require_results) mod_f16le :: proc "contextless" (x, y: f16le) -> (n: f16le) { return #force_inline f16le(mod_f16(f16(x), f16(y))) }
  841. @(require_results) mod_f16be :: proc "contextless" (x, y: f16be) -> (n: f16be) { return #force_inline f16be(mod_f16(f16(x), f16(y))) }
  842. @(require_results)
  843. mod_f32 :: proc "contextless" (x, y: f32) -> (n: f32) {
  844. z := abs(y)
  845. n = remainder(abs(x), z)
  846. if sign(n) < 0 {
  847. n += z
  848. }
  849. return copy_sign(n, x)
  850. }
  851. @(require_results)
  852. mod_f32le :: proc "contextless" (x, y: f32le) -> (n: f32le) { return #force_inline f32le(mod_f32(f32(x), f32(y))) }
  853. @(require_results)
  854. mod_f32be :: proc "contextless" (x, y: f32be) -> (n: f32be) { return #force_inline f32be(mod_f32(f32(x), f32(y))) }
  855. @(require_results)
  856. mod_f64 :: proc "contextless" (x, y: f64) -> (n: f64) {
  857. z := abs(y)
  858. n = remainder(abs(x), z)
  859. if sign(n) < 0 {
  860. n += z
  861. }
  862. return copy_sign(n, x)
  863. }
  864. @(require_results)
  865. mod_f64le :: proc "contextless" (x, y: f64le) -> (n: f64le) { return #force_inline f64le(mod_f64(f64(x), f64(y))) }
  866. @(require_results)
  867. mod_f64be :: proc "contextless" (x, y: f64be) -> (n: f64be) { return #force_inline f64be(mod_f64(f64(x), f64(y))) }
  868. mod :: proc{
  869. mod_f16, mod_f16le, mod_f16be,
  870. mod_f32, mod_f32le, mod_f32be,
  871. mod_f64, mod_f64le, mod_f64be,
  872. }
  873. @(require_results) remainder_f16 :: proc "contextless" (x, y: f16 ) -> f16 { return x - round(x/y) * y }
  874. @(require_results) remainder_f16le :: proc "contextless" (x, y: f16le) -> f16le { return x - round(x/y) * y }
  875. @(require_results) remainder_f16be :: proc "contextless" (x, y: f16be) -> f16be { return x - round(x/y) * y }
  876. @(require_results) remainder_f32 :: proc "contextless" (x, y: f32 ) -> f32 { return x - round(x/y) * y }
  877. @(require_results) remainder_f32le :: proc "contextless" (x, y: f32le) -> f32le { return x - round(x/y) * y }
  878. @(require_results) remainder_f32be :: proc "contextless" (x, y: f32be) -> f32be { return x - round(x/y) * y }
  879. @(require_results) remainder_f64 :: proc "contextless" (x, y: f64 ) -> f64 { return x - round(x/y) * y }
  880. @(require_results) remainder_f64le :: proc "contextless" (x, y: f64le) -> f64le { return x - round(x/y) * y }
  881. @(require_results) remainder_f64be :: proc "contextless" (x, y: f64be) -> f64be { return x - round(x/y) * y }
  882. remainder :: proc{
  883. remainder_f16, remainder_f16le, remainder_f16be,
  884. remainder_f32, remainder_f32le, remainder_f32be,
  885. remainder_f64, remainder_f64le, remainder_f64be,
  886. }
  887. @(require_results)
  888. gcd :: proc "contextless" (x, y: $T) -> T
  889. where intrinsics.type_is_ordered_numeric(T) {
  890. x, y := x, y
  891. for y != 0 {
  892. x %= y
  893. x, y = y, x
  894. }
  895. return abs(x)
  896. }
  897. @(require_results)
  898. lcm :: proc "contextless" (x, y: $T) -> T
  899. where intrinsics.type_is_ordered_numeric(T) {
  900. return x / gcd(x, y) * y
  901. }
  902. @(require_results)
  903. normalize_f16 :: proc "contextless" (x: f16) -> (y: f16, exponent: int) {
  904. if abs(x) < F16_MIN {
  905. return x * (1<<F16_SHIFT), -F16_SHIFT
  906. }
  907. return x, 0
  908. }
  909. @(require_results)
  910. normalize_f32 :: proc "contextless" (x: f32) -> (y: f32, exponent: int) {
  911. if abs(x) < F32_MIN {
  912. return x * (1<<F32_SHIFT), -F32_SHIFT
  913. }
  914. return x, 0
  915. }
  916. @(require_results)
  917. normalize_f64 :: proc "contextless" (x: f64) -> (y: f64, exponent: int) {
  918. if abs(x) < F64_MIN {
  919. return x * (1<<F64_SHIFT), -F64_SHIFT
  920. }
  921. return x, 0
  922. }
  923. @(require_results) normalize_f16le :: proc "contextless" (x: f16le) -> (y: f16le, exponent: int) { y0, e := normalize_f16(f16(x)); return f16le(y0), e }
  924. @(require_results) normalize_f16be :: proc "contextless" (x: f16be) -> (y: f16be, exponent: int) { y0, e := normalize_f16(f16(x)); return f16be(y0), e }
  925. @(require_results) normalize_f32le :: proc "contextless" (x: f32le) -> (y: f32le, exponent: int) { y0, e := normalize_f32(f32(x)); return f32le(y0), e }
  926. @(require_results) normalize_f32be :: proc "contextless" (x: f32be) -> (y: f32be, exponent: int) { y0, e := normalize_f32(f32(x)); return f32be(y0), e }
  927. @(require_results) normalize_f64le :: proc "contextless" (x: f64le) -> (y: f64le, exponent: int) { y0, e := normalize_f64(f64(x)); return f64le(y0), e }
  928. @(require_results) normalize_f64be :: proc "contextless" (x: f64be) -> (y: f64be, exponent: int) { y0, e := normalize_f64(f64(x)); return f64be(y0), e }
  929. normalize :: proc{
  930. normalize_f16,
  931. normalize_f32,
  932. normalize_f64,
  933. normalize_f16le,
  934. normalize_f16be,
  935. normalize_f32le,
  936. normalize_f32be,
  937. normalize_f64le,
  938. normalize_f64be,
  939. }
  940. @(require_results)
  941. frexp_f16 :: proc "contextless" (x: f16) -> (significand: f16, exponent: int) {
  942. f, e := frexp_f64(f64(x))
  943. return f16(f), e
  944. }
  945. @(require_results)
  946. frexp_f16le :: proc "contextless" (x: f16le) -> (significand: f16le, exponent: int) {
  947. f, e := frexp_f64(f64(x))
  948. return f16le(f), e
  949. }
  950. @(require_results)
  951. frexp_f16be :: proc "contextless" (x: f16be) -> (significand: f16be, exponent: int) {
  952. f, e := frexp_f64(f64(x))
  953. return f16be(f), e
  954. }
  955. @(require_results)
  956. frexp_f32 :: proc "contextless" (x: f32) -> (significand: f32, exponent: int) {
  957. f, e := frexp_f64(f64(x))
  958. return f32(f), e
  959. }
  960. @(require_results)
  961. frexp_f32le :: proc "contextless" (x: f32le) -> (significand: f32le, exponent: int) {
  962. f, e := frexp_f64(f64(x))
  963. return f32le(f), e
  964. }
  965. @(require_results)
  966. frexp_f32be :: proc "contextless" (x: f32be) -> (significand: f32be, exponent: int) {
  967. f, e := frexp_f64(f64(x))
  968. return f32be(f), e
  969. }
  970. @(require_results)
  971. frexp_f64 :: proc "contextless" (f: f64) -> (significand: f64, exponent: int) {
  972. mask :: F64_MASK
  973. shift :: F64_SHIFT
  974. bias :: F64_BIAS
  975. switch {
  976. case f == 0:
  977. return 0, 0
  978. case is_inf(f) || is_nan(f):
  979. return f, 0
  980. }
  981. f := f
  982. f, exponent = normalize_f64(f)
  983. x := transmute(u64)f
  984. exponent += int((x>>shift)&mask) - bias + 1
  985. x &~= mask << shift
  986. x |= (-1 + bias) << shift
  987. significand = transmute(f64)x
  988. return
  989. }
  990. @(require_results)
  991. frexp_f64le :: proc "contextless" (x: f64le) -> (significand: f64le, exponent: int) {
  992. f, e := frexp_f64(f64(x))
  993. return f64le(f), e
  994. }
  995. @(require_results)
  996. frexp_f64be :: proc "contextless" (x: f64be) -> (significand: f64be, exponent: int) {
  997. f, e := frexp_f64(f64(x))
  998. return f64be(f), e
  999. }
  1000. // frexp breaks the value into a normalized fraction, and an integral power of two
  1001. // It returns a significand and exponent satisfying x == significand * 2**exponent
  1002. // with the absolute value of significand in the intervalue of [0.5, 1).
  1003. //
  1004. // Special cases:
  1005. // frexp(+0) = +0, 0
  1006. // frexp(-0) = -0, 0
  1007. // frexp(+inf) = +inf, 0
  1008. // frexp(-inf) = -inf, 0
  1009. // frexp(NaN) = NaN, 0
  1010. frexp :: proc{
  1011. frexp_f16, frexp_f16le, frexp_f16be,
  1012. frexp_f32, frexp_f32le, frexp_f32be,
  1013. frexp_f64, frexp_f64le, frexp_f64be,
  1014. }
  1015. @(require_results)
  1016. binomial :: proc "contextless" (n, k: int) -> int {
  1017. switch {
  1018. case k <= 0: return 1
  1019. case 2*k > n: return binomial(n, n-k)
  1020. }
  1021. b := n
  1022. for i in 2..<k {
  1023. b = (b * (n+1-i))/i
  1024. }
  1025. return b
  1026. }
  1027. @(require_results)
  1028. factorial :: proc "contextless" (n: int) -> int {
  1029. when size_of(int) == size_of(i64) {
  1030. @static table := [21]int{
  1031. 1,
  1032. 1,
  1033. 2,
  1034. 6,
  1035. 24,
  1036. 120,
  1037. 720,
  1038. 5_040,
  1039. 40_320,
  1040. 362_880,
  1041. 3_628_800,
  1042. 39_916_800,
  1043. 479_001_600,
  1044. 6_227_020_800,
  1045. 87_178_291_200,
  1046. 1_307_674_368_000,
  1047. 20_922_789_888_000,
  1048. 355_687_428_096_000,
  1049. 6_402_373_705_728_000,
  1050. 121_645_100_408_832_000,
  1051. 2_432_902_008_176_640_000,
  1052. }
  1053. } else {
  1054. @static table := [13]int{
  1055. 1,
  1056. 1,
  1057. 2,
  1058. 6,
  1059. 24,
  1060. 120,
  1061. 720,
  1062. 5_040,
  1063. 40_320,
  1064. 362_880,
  1065. 3_628_800,
  1066. 39_916_800,
  1067. 479_001_600,
  1068. }
  1069. }
  1070. return table[n]
  1071. }
  1072. @(require_results)
  1073. classify_f16 :: proc "contextless" (x: f16) -> Float_Class {
  1074. switch {
  1075. case x == 0:
  1076. i := transmute(i16)x
  1077. if i < 0 {
  1078. return .Neg_Zero
  1079. }
  1080. return .Zero
  1081. case x*0.25 == x:
  1082. if x < 0 {
  1083. return .Neg_Inf
  1084. }
  1085. return .Inf
  1086. case !(x == x):
  1087. return .NaN
  1088. }
  1089. u := transmute(u16)x
  1090. exp := int(u>>10) & (1<<5 - 1)
  1091. if exp == 0 {
  1092. return .Subnormal
  1093. }
  1094. return .Normal
  1095. }
  1096. @(require_results) classify_f16le :: proc "contextless" (x: f16le) -> Float_Class { return #force_inline classify_f16(f16(x)) }
  1097. @(require_results) classify_f16be :: proc "contextless" (x: f16be) -> Float_Class { return #force_inline classify_f16(f16(x)) }
  1098. @(require_results)
  1099. classify_f32 :: proc "contextless" (x: f32) -> Float_Class {
  1100. switch {
  1101. case x == 0:
  1102. i := transmute(i32)x
  1103. if i < 0 {
  1104. return .Neg_Zero
  1105. }
  1106. return .Zero
  1107. case x*0.5 == x:
  1108. if x < 0 {
  1109. return .Neg_Inf
  1110. }
  1111. return .Inf
  1112. case !(x == x):
  1113. return .NaN
  1114. }
  1115. u := transmute(u32)x
  1116. exp := int(u>>23) & (1<<8 - 1)
  1117. if exp == 0 {
  1118. return .Subnormal
  1119. }
  1120. return .Normal
  1121. }
  1122. @(require_results) classify_f32le :: proc "contextless" (x: f32le) -> Float_Class { return #force_inline classify_f32(f32(x)) }
  1123. @(require_results) classify_f32be :: proc "contextless" (x: f32be) -> Float_Class { return #force_inline classify_f32(f32(x)) }
  1124. @(require_results)
  1125. classify_f64 :: proc "contextless" (x: f64) -> Float_Class {
  1126. switch {
  1127. case x == 0:
  1128. i := transmute(i64)x
  1129. if i < 0 {
  1130. return .Neg_Zero
  1131. }
  1132. return .Zero
  1133. case x*0.5 == x:
  1134. if x < 0 {
  1135. return .Neg_Inf
  1136. }
  1137. return .Inf
  1138. case !(x == x):
  1139. return .NaN
  1140. }
  1141. u := transmute(u64)x
  1142. exp := int(u>>52) & (1<<11 - 1)
  1143. if exp == 0 {
  1144. return .Subnormal
  1145. }
  1146. return .Normal
  1147. }
  1148. @(require_results) classify_f64le :: proc "contextless" (x: f64le) -> Float_Class { return #force_inline classify_f64(f64(x)) }
  1149. @(require_results) classify_f64be :: proc "contextless" (x: f64be) -> Float_Class { return #force_inline classify_f64(f64(x)) }
  1150. // Returns the `Float_Class` of the value, i.e. whether normal, subnormal, zero, negative zero, NaN, infinity or
  1151. // negative infinity.
  1152. classify :: proc{
  1153. classify_f16, classify_f16le, classify_f16be,
  1154. classify_f32, classify_f32le, classify_f32be,
  1155. classify_f64, classify_f64le, classify_f64be,
  1156. }
  1157. @(require_results) is_nan_f16 :: proc "contextless" (x: f16) -> bool { return classify(x) == .NaN }
  1158. @(require_results) is_nan_f16le :: proc "contextless" (x: f16le) -> bool { return classify(x) == .NaN }
  1159. @(require_results) is_nan_f16be :: proc "contextless" (x: f16be) -> bool { return classify(x) == .NaN }
  1160. @(require_results) is_nan_f32 :: proc "contextless" (x: f32) -> bool { return classify(x) == .NaN }
  1161. @(require_results) is_nan_f32le :: proc "contextless" (x: f32le) -> bool { return classify(x) == .NaN }
  1162. @(require_results) is_nan_f32be :: proc "contextless" (x: f32be) -> bool { return classify(x) == .NaN }
  1163. @(require_results) is_nan_f64 :: proc "contextless" (x: f64) -> bool { return classify(x) == .NaN }
  1164. @(require_results) is_nan_f64le :: proc "contextless" (x: f64le) -> bool { return classify(x) == .NaN }
  1165. @(require_results) is_nan_f64be :: proc "contextless" (x: f64be) -> bool { return classify(x) == .NaN }
  1166. is_nan :: proc{
  1167. is_nan_f16, is_nan_f16le, is_nan_f16be,
  1168. is_nan_f32, is_nan_f32le, is_nan_f32be,
  1169. is_nan_f64, is_nan_f64le, is_nan_f64be,
  1170. }
  1171. // is_inf reports whether f is an infinity, according to sign.
  1172. // If sign > 0, is_inf reports whether f is positive infinity.
  1173. // If sign < 0, is_inf reports whether f is negative infinity.
  1174. // If sign == 0, is_inf reports whether f is either infinity.
  1175. @(require_results)
  1176. is_inf_f16 :: proc "contextless" (x: f16, sign: int = 0) -> bool {
  1177. class := classify(x)
  1178. switch {
  1179. case sign > 0:
  1180. return class == .Inf
  1181. case sign < 0:
  1182. return class == .Neg_Inf
  1183. }
  1184. return class == .Inf || class == .Neg_Inf
  1185. }
  1186. @(require_results)
  1187. is_inf_f16le :: proc "contextless" (x: f16le, sign: int = 0) -> bool {
  1188. return #force_inline is_inf_f16(f16(x), sign)
  1189. }
  1190. @(require_results)
  1191. is_inf_f16be :: proc "contextless" (x: f16be, sign: int = 0) -> bool {
  1192. return #force_inline is_inf_f16(f16(x), sign)
  1193. }
  1194. @(require_results)
  1195. is_inf_f32 :: proc "contextless" (x: f32, sign: int = 0) -> bool {
  1196. class := classify(x)
  1197. switch {
  1198. case sign > 0:
  1199. return class == .Inf
  1200. case sign < 0:
  1201. return class == .Neg_Inf
  1202. }
  1203. return class == .Inf || class == .Neg_Inf
  1204. }
  1205. @(require_results)
  1206. is_inf_f32le :: proc "contextless" (x: f32le, sign: int = 0) -> bool {
  1207. return #force_inline is_inf_f32(f32(x), sign)
  1208. }
  1209. @(require_results)
  1210. is_inf_f32be :: proc "contextless" (x: f32be, sign: int = 0) -> bool {
  1211. return #force_inline is_inf_f32(f32(x), sign)
  1212. }
  1213. @(require_results)
  1214. is_inf_f64 :: proc "contextless" (x: f64, sign: int = 0) -> bool {
  1215. class := classify(x)
  1216. switch {
  1217. case sign > 0:
  1218. return class == .Inf
  1219. case sign < 0:
  1220. return class == .Neg_Inf
  1221. }
  1222. return class == .Inf || class == .Neg_Inf
  1223. }
  1224. @(require_results)
  1225. is_inf_f64le :: proc "contextless" (x: f64le, sign: int = 0) -> bool {
  1226. return #force_inline is_inf_f64(f64(x), sign)
  1227. }
  1228. @(require_results)
  1229. is_inf_f64be :: proc "contextless" (x: f64be, sign: int = 0) -> bool {
  1230. return #force_inline is_inf_f64(f64(x), sign)
  1231. }
  1232. is_inf :: proc{
  1233. is_inf_f16, is_inf_f16le, is_inf_f16be,
  1234. is_inf_f32, is_inf_f32le, is_inf_f32be,
  1235. is_inf_f64, is_inf_f64le, is_inf_f64be,
  1236. }
  1237. @(require_results)
  1238. inf_f16 :: proc "contextless" (sign: int) -> f16 {
  1239. return f16(inf_f64(sign))
  1240. }
  1241. @(require_results)
  1242. inf_f16le :: proc "contextless" (sign: int) -> f16le {
  1243. return f16le(inf_f64(sign))
  1244. }
  1245. @(require_results)
  1246. inf_f16be :: proc "contextless" (sign: int) -> f16be {
  1247. return f16be(inf_f64(sign))
  1248. }
  1249. @(require_results)
  1250. inf_f32 :: proc "contextless" (sign: int) -> f32 {
  1251. return f32(inf_f64(sign))
  1252. }
  1253. @(require_results)
  1254. inf_f32le :: proc "contextless" (sign: int) -> f32le {
  1255. return f32le(inf_f64(sign))
  1256. }
  1257. @(require_results)
  1258. inf_f32be :: proc "contextless" (sign: int) -> f32be {
  1259. return f32be(inf_f64(sign))
  1260. }
  1261. @(require_results)
  1262. inf_f64 :: proc "contextless" (sign: int) -> f64 {
  1263. if sign >= 0 {
  1264. return 0h7ff00000_00000000
  1265. } else {
  1266. return 0hfff00000_00000000
  1267. }
  1268. }
  1269. @(require_results)
  1270. inf_f64le :: proc "contextless" (sign: int) -> f64le {
  1271. return f64le(inf_f64(sign))
  1272. }
  1273. @(require_results)
  1274. inf_f64be :: proc "contextless" (sign: int) -> f64be {
  1275. return f64be(inf_f64(sign))
  1276. }
  1277. @(require_results)
  1278. nan_f16 :: proc "contextless" () -> f16 {
  1279. return f16(nan_f64())
  1280. }
  1281. @(require_results)
  1282. nan_f16le :: proc "contextless" () -> f16le {
  1283. return f16le(nan_f64())
  1284. }
  1285. @(require_results)
  1286. nan_f16be :: proc "contextless" () -> f16be {
  1287. return f16be(nan_f64())
  1288. }
  1289. @(require_results)
  1290. nan_f32 :: proc "contextless" () -> f32 {
  1291. return f32(nan_f64())
  1292. }
  1293. @(require_results)
  1294. nan_f32le :: proc "contextless" () -> f32le {
  1295. return f32le(nan_f64())
  1296. }
  1297. @(require_results)
  1298. nan_f32be :: proc "contextless" () -> f32be {
  1299. return f32be(nan_f64())
  1300. }
  1301. @(require_results)
  1302. nan_f64 :: proc "contextless" () -> f64 {
  1303. return 0h7ff80000_00000001
  1304. }
  1305. @(require_results)
  1306. nan_f64le :: proc "contextless" () -> f64le {
  1307. return f64le(nan_f64())
  1308. }
  1309. @(require_results)
  1310. nan_f64be :: proc "contextless" () -> f64be {
  1311. return f64be(nan_f64())
  1312. }
  1313. @(require_results)
  1314. is_power_of_two :: proc "contextless" (x: int) -> bool {
  1315. return x > 0 && (x & (x-1)) == 0
  1316. }
  1317. @(require_results)
  1318. next_power_of_two :: proc "contextless" (x: int) -> int {
  1319. k := x -1
  1320. when size_of(int) == 8 {
  1321. k = k | (k >> 32)
  1322. }
  1323. k = k | (k >> 16)
  1324. k = k | (k >> 8)
  1325. k = k | (k >> 4)
  1326. k = k | (k >> 2)
  1327. k = k | (k >> 1)
  1328. k += 1 + int(x <= 0)
  1329. return k
  1330. }
  1331. @(require_results)
  1332. sum :: proc "contextless" (x: $T/[]$E) -> (res: E)
  1333. where intrinsics.type_is_numeric(E) {
  1334. for i in x {
  1335. res += i
  1336. }
  1337. return
  1338. }
  1339. @(require_results)
  1340. prod :: proc "contextless" (x: $T/[]$E) -> (res: E)
  1341. where intrinsics.type_is_numeric(E) {
  1342. res = 1
  1343. for i in x {
  1344. res *= i
  1345. }
  1346. return
  1347. }
  1348. cumsum_inplace :: proc "contextless" (x: $T/[]$E)
  1349. where intrinsics.type_is_numeric(E) {
  1350. for i in 1..<len(x) {
  1351. x[i] = x[i-1] + x[i]
  1352. }
  1353. }
  1354. @(require_results)
  1355. cumsum :: proc "contextless" (dst, src: $T/[]$E) -> T
  1356. where intrinsics.type_is_numeric(E) {
  1357. N := min(len(dst), len(src))
  1358. if N > 0 {
  1359. dst[0] = src[0]
  1360. for i in 1..<N {
  1361. dst[i] = dst[i-1] + src[i]
  1362. }
  1363. }
  1364. return dst[:N]
  1365. }
  1366. @(require_results)
  1367. atan2_f16 :: proc "contextless" (y, x: f16) -> f16 {
  1368. // TODO(bill): Better atan2_f16
  1369. return f16(atan2_f64(f64(y), f64(x)))
  1370. }
  1371. @(require_results)
  1372. atan2_f16le :: proc "contextless" (y, x: f16le) -> f16le {
  1373. // TODO(bill): Better atan2_f16
  1374. return f16le(atan2_f64(f64(y), f64(x)))
  1375. }
  1376. @(require_results)
  1377. atan2_f16be :: proc "contextless" (y, x: f16be) -> f16be {
  1378. // TODO(bill): Better atan2_f16
  1379. return f16be(atan2_f64(f64(y), f64(x)))
  1380. }
  1381. @(require_results)
  1382. atan2_f32 :: proc "contextless" (y, x: f32) -> f32 {
  1383. // TODO(bill): Better atan2_f32
  1384. return f32(atan2_f64(f64(y), f64(x)))
  1385. }
  1386. @(require_results)
  1387. atan2_f32le :: proc "contextless" (y, x: f32le) -> f32le {
  1388. // TODO(bill): Better atan2_f32
  1389. return f32le(atan2_f64(f64(y), f64(x)))
  1390. }
  1391. @(require_results)
  1392. atan2_f32be :: proc "contextless" (y, x: f32be) -> f32be {
  1393. // TODO(bill): Better atan2_f32
  1394. return f32be(atan2_f64(f64(y), f64(x)))
  1395. }
  1396. @(require_results)
  1397. atan2_f64 :: proc "contextless" (y, x: f64) -> f64 {
  1398. // TODO(bill): Faster atan2_f64 if possible
  1399. // The original C code:
  1400. // Stephen L. Moshier
  1401. // [email protected]
  1402. NAN :: 0h7fff_ffff_ffff_ffff
  1403. INF :: 0h7FF0_0000_0000_0000
  1404. PI :: 0h4009_21fb_5444_2d18
  1405. atan :: proc "contextless" (x: f64) -> f64 {
  1406. if x == 0 {
  1407. return x
  1408. }
  1409. if x > 0 {
  1410. return s_atan(x)
  1411. }
  1412. return -s_atan(-x)
  1413. }
  1414. // s_atan reduces its argument (known to be positive) to the range [0, 0.66] and calls x_atan.
  1415. s_atan :: proc "contextless" (x: f64) -> f64 {
  1416. MORE_BITS :: 6.123233995736765886130e-17 // pi/2 = PIO2 + MORE_BITS
  1417. TAN3PI08 :: 2.41421356237309504880 // tan(3*pi/8)
  1418. if x <= 0.66 {
  1419. return x_atan(x)
  1420. }
  1421. if x > TAN3PI08 {
  1422. return PI/2 - x_atan(1/x) + MORE_BITS
  1423. }
  1424. return PI/4 + x_atan((x-1)/(x+1)) + 0.5*MORE_BITS
  1425. }
  1426. // x_atan evaluates a series valid in the range [0, 0.66].
  1427. x_atan :: proc "contextless" (x: f64) -> f64 {
  1428. P0 :: -8.750608600031904122785e-01
  1429. P1 :: -1.615753718733365076637e+01
  1430. P2 :: -7.500855792314704667340e+01
  1431. P3 :: -1.228866684490136173410e+02
  1432. P4 :: -6.485021904942025371773e+01
  1433. Q0 :: +2.485846490142306297962e+01
  1434. Q1 :: +1.650270098316988542046e+02
  1435. Q2 :: +4.328810604912902668951e+02
  1436. Q3 :: +4.853903996359136964868e+02
  1437. Q4 :: +1.945506571482613964425e+02
  1438. z := x * x
  1439. z = z * ((((P0*z+P1)*z+P2)*z+P3)*z + P4) / (((((z+Q0)*z+Q1)*z+Q2)*z+Q3)*z + Q4)
  1440. z = x*z + x
  1441. return z
  1442. }
  1443. switch {
  1444. case is_nan(y) || is_nan(x):
  1445. return NAN
  1446. case y == 0:
  1447. if x >= 0 && !sign_bit(x) {
  1448. return copy_sign(0.0, y)
  1449. }
  1450. return copy_sign(PI, y)
  1451. case x == 0:
  1452. return copy_sign(PI/2, y)
  1453. case is_inf(x, 0):
  1454. if is_inf(x, 1) {
  1455. if is_inf(y, 0) {
  1456. return copy_sign(PI/4, y)
  1457. }
  1458. return copy_sign(0, y)
  1459. }
  1460. if is_inf(y, 0) {
  1461. return copy_sign(3*PI/4, y)
  1462. }
  1463. return copy_sign(PI, y)
  1464. case is_inf(y, 0):
  1465. return copy_sign(PI/2, y)
  1466. }
  1467. q := atan(y / x)
  1468. if x < 0 {
  1469. if q <= 0 {
  1470. return q + PI
  1471. }
  1472. return q - PI
  1473. }
  1474. return q
  1475. }
  1476. @(require_results)
  1477. atan2_f64le :: proc "contextless" (y, x: f64le) -> f64le {
  1478. // TODO(bill): Better atan2_f32
  1479. return f64le(atan2_f64(f64(y), f64(x)))
  1480. }
  1481. @(require_results)
  1482. atan2_f64be :: proc "contextless" (y, x: f64be) -> f64be {
  1483. // TODO(bill): Better atan2_f32
  1484. return f64be(atan2_f64(f64(y), f64(x)))
  1485. }
  1486. atan2 :: proc{
  1487. atan2_f64, atan2_f32, atan2_f16,
  1488. atan2_f64le, atan2_f64be,
  1489. atan2_f32le, atan2_f32be,
  1490. atan2_f16le, atan2_f16be,
  1491. }
  1492. @(require_results)
  1493. atan :: proc "contextless" (x: $T) -> T where intrinsics.type_is_float(T) {
  1494. return atan2(x, 1)
  1495. }
  1496. @(require_results)
  1497. asin_f64 :: proc "contextless" (x: f64) -> f64 {
  1498. /* origin: FreeBSD /usr/src/lib/msun/src/e_asin.c */
  1499. /*
  1500. * ====================================================
  1501. * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
  1502. *
  1503. * Developed at SunSoft, a Sun Microsystems, Inc. business.
  1504. * Permission to use, copy, modify, and distribute this
  1505. * software is freely granted, provided that this notice
  1506. * is preserved.
  1507. * ====================================================
  1508. */
  1509. pio2_hi :: 0h3FF921FB54442D18
  1510. pio2_lo :: 0h3C91A62633145C07
  1511. pS0 :: 0h3FC5555555555555
  1512. pS1 :: 0hBFD4D61203EB6F7D
  1513. pS2 :: 0h3FC9C1550E884455
  1514. pS3 :: 0hBFA48228B5688F3B
  1515. pS4 :: 0h3F49EFE07501B288
  1516. pS5 :: 0h3F023DE10DFDF709
  1517. qS1 :: 0hC0033A271C8A2D4B
  1518. qS2 :: 0h40002AE59C598AC8
  1519. qS3 :: 0hBFE6066C1B8D0159
  1520. qS4 :: 0h3FB3B8C5B12E9282
  1521. R :: #force_inline proc "contextless" (z: f64) -> f64 {
  1522. p, q: f64
  1523. p = z*(pS0+z*(pS1+z*(pS2+z*(pS3+z*(pS4+z*pS5)))))
  1524. q = 1.0+z*(qS1+z*(qS2+z*(qS3+z*qS4)))
  1525. return p/q
  1526. }
  1527. x := x
  1528. z, r, s: f64
  1529. dwords := transmute([2]u32)x
  1530. hx := dwords[1]
  1531. ix := hx & 0x7fffffff
  1532. /* |x| >= 1 or nan */
  1533. if ix >= 0x3ff00000 {
  1534. lx := dwords[0]
  1535. if (ix-0x3ff00000 | lx) == 0 {
  1536. /* asin(1) = +-pi/2 with inexact */
  1537. return x*pio2_hi + 1e-120
  1538. }
  1539. return 0/(x-x)
  1540. }
  1541. /* |x| < 0.5 */
  1542. if ix < 0x3fe00000 {
  1543. /* if 0x1p-1022 <= |x| < 0x1p-26, avoid raising underflow */
  1544. if ix < 0x3e500000 && ix >= 0x00100000 {
  1545. return x
  1546. }
  1547. return x + x*R(x*x)
  1548. }
  1549. /* 1 > |x| >= 0.5 */
  1550. z = (1 - abs(x))*0.5
  1551. s = sqrt(z)
  1552. r = R(z)
  1553. if ix >= 0x3fef3333 { /* if |x| > 0.975 */
  1554. x = pio2_hi-(2*(s+s*r)-pio2_lo)
  1555. } else {
  1556. f, c: f64
  1557. /* f+c = sqrt(z) */
  1558. f = s
  1559. (^u64)(&f)^ &= 0xffffffff_00000000
  1560. c = (z-f*f)/(s+f)
  1561. x = 0.5*pio2_hi - (2*s*r - (pio2_lo-2*c) - (0.5*pio2_hi-2*f))
  1562. }
  1563. return -x if hx >> 31 != 0 else x
  1564. }
  1565. @(require_results)
  1566. asin_f64le :: proc "contextless" (x: f64le) -> f64le {
  1567. return f64le(asin_f64(f64(x)))
  1568. }
  1569. @(require_results)
  1570. asin_f64be :: proc "contextless" (x: f64be) -> f64be {
  1571. return f64be(asin_f64(f64(x)))
  1572. }
  1573. @(require_results)
  1574. asin_f32 :: proc "contextless" (x: f32) -> f32 {
  1575. return f32(asin_f64(f64(x)))
  1576. }
  1577. @(require_results)
  1578. asin_f32le :: proc "contextless" (x: f32le) -> f32le {
  1579. return f32le(asin_f64(f64(x)))
  1580. }
  1581. @(require_results)
  1582. asin_f32be :: proc "contextless" (x: f32be) -> f32be {
  1583. return f32be(asin_f64(f64(x)))
  1584. }
  1585. @(require_results)
  1586. asin_f16 :: proc "contextless" (x: f16) -> f16 {
  1587. return f16(asin_f64(f64(x)))
  1588. }
  1589. @(require_results)
  1590. asin_f16le :: proc "contextless" (x: f16le) -> f16le {
  1591. return f16le(asin_f64(f64(x)))
  1592. }
  1593. @(require_results)
  1594. asin_f16be :: proc "contextless" (x: f16be) -> f16be {
  1595. return f16be(asin_f64(f64(x)))
  1596. }
  1597. asin :: proc{
  1598. asin_f64, asin_f32, asin_f16,
  1599. asin_f64le, asin_f64be,
  1600. asin_f32le, asin_f32be,
  1601. asin_f16le, asin_f16be,
  1602. }
  1603. @(require_results)
  1604. acos_f64 :: proc "contextless" (x: f64) -> f64 {
  1605. /* origin: FreeBSD /usr/src/lib/msun/src/e_acos.c */
  1606. /*
  1607. * ====================================================
  1608. * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
  1609. *
  1610. * Developed at SunSoft, a Sun Microsystems, Inc. business.
  1611. * Permission to use, copy, modify, and distribute this
  1612. * software is freely granted, provided that this notice
  1613. * is preserved.
  1614. * ====================================================
  1615. */
  1616. pio2_hi :: 0h3FF921FB54442D18
  1617. pio2_lo :: 0h3C91A62633145C07
  1618. pS0 :: 0h3FC5555555555555
  1619. pS1 :: 0hBFD4D61203EB6F7D
  1620. pS2 :: 0h3FC9C1550E884455
  1621. pS3 :: 0hBFA48228B5688F3B
  1622. pS4 :: 0h3F49EFE07501B288
  1623. pS5 :: 0h3F023DE10DFDF709
  1624. qS1 :: 0hC0033A271C8A2D4B
  1625. qS2 :: 0h40002AE59C598AC8
  1626. qS3 :: 0hBFE6066C1B8D0159
  1627. qS4 :: 0h3FB3B8C5B12E9282
  1628. R :: #force_inline proc "contextless" (z: f64) -> f64 {
  1629. p, q: f64
  1630. p = z*(pS0+z*(pS1+z*(pS2+z*(pS3+z*(pS4+z*pS5)))))
  1631. q = 1.0+z*(qS1+z*(qS2+z*(qS3+z*qS4)))
  1632. return p/q
  1633. }
  1634. z, w, s, c, df: f64
  1635. dwords := transmute([2]u32)x
  1636. hx := dwords[1]
  1637. ix := hx & 0x7fffffff
  1638. /* |x| >= 1 or nan */
  1639. if ix >= 0x3ff00000 {
  1640. lx := dwords[0]
  1641. if (ix-0x3ff00000 | lx) == 0 {
  1642. /* acos(1)=0, acos(-1)=pi */
  1643. if hx >> 31 != 0 {
  1644. return 2*pio2_hi + 1e-120
  1645. }
  1646. return 0
  1647. }
  1648. return 0/(x-x)
  1649. }
  1650. /* |x| < 0.5 */
  1651. if ix < 0x3fe00000 {
  1652. if ix <= 0x3c600000 { /* |x| < 2**-57 */
  1653. return pio2_hi + 1e-120
  1654. }
  1655. return pio2_hi - (x - (pio2_lo-x*R(x*x)))
  1656. }
  1657. /* x < -0.5 */
  1658. if hx >> 31 != 0 {
  1659. z = (1.0+x)*0.5
  1660. s = sqrt(z)
  1661. w = R(z)*s-pio2_lo
  1662. return 2*(pio2_hi - (s+w))
  1663. }
  1664. /* x > 0.5 */
  1665. z = (1.0-x)*0.5
  1666. s = sqrt(z)
  1667. df = s
  1668. (^u64)(&df)^ &= 0xffffffff_00000000
  1669. c = (z-df*df)/(s+df)
  1670. w = R(z)*s+c
  1671. return 2*(df+w)
  1672. }
  1673. @(require_results)
  1674. acos_f64le :: proc "contextless" (x: f64le) -> f64le {
  1675. return f64le(acos_f64(f64(x)))
  1676. }
  1677. @(require_results)
  1678. acos_f64be :: proc "contextless" (x: f64be) -> f64be {
  1679. return f64be(acos_f64(f64(x)))
  1680. }
  1681. @(require_results)
  1682. acos_f32 :: proc "contextless" (x: f32) -> f32 {
  1683. return f32(acos_f64(f64(x)))
  1684. }
  1685. @(require_results)
  1686. acos_f32le :: proc "contextless" (x: f32le) -> f32le {
  1687. return f32le(acos_f64(f64(x)))
  1688. }
  1689. @(require_results)
  1690. acos_f32be :: proc "contextless" (x: f32be) -> f32be {
  1691. return f32be(acos_f64(f64(x)))
  1692. }
  1693. @(require_results)
  1694. acos_f16 :: proc "contextless" (x: f16) -> f16 {
  1695. return f16(acos_f64(f64(x)))
  1696. }
  1697. @(require_results)
  1698. acos_f16le :: proc "contextless" (x: f16le) -> f16le {
  1699. return f16le(acos_f64(f64(x)))
  1700. }
  1701. @(require_results)
  1702. acos_f16be :: proc "contextless" (x: f16be) -> f16be {
  1703. return f16be(acos_f64(f64(x)))
  1704. }
  1705. acos :: proc{
  1706. acos_f64, acos_f32, acos_f16,
  1707. acos_f64le, acos_f64be,
  1708. acos_f32le, acos_f32be,
  1709. acos_f16le, acos_f16be,
  1710. }
  1711. @(require_results)
  1712. sinh :: proc "contextless" (x: $T) -> T where intrinsics.type_is_float(T) {
  1713. return copy_sign(((exp(x) - exp(-x))*0.5), x)
  1714. }
  1715. @(require_results)
  1716. cosh :: proc "contextless" (x: $T) -> T where intrinsics.type_is_float(T) {
  1717. return ((exp(x) + exp(-x))*0.5)
  1718. }
  1719. @(require_results)
  1720. tanh :: proc "contextless" (y: $T) -> T where intrinsics.type_is_float(T) {
  1721. P0 :: -9.64399179425052238628e-1
  1722. P1 :: -9.92877231001918586564e1
  1723. P2 :: -1.61468768441708447952e3
  1724. Q0 :: +1.12811678491632931402e2
  1725. Q1 :: +2.23548839060100448583e3
  1726. Q2 :: +4.84406305325125486048e3
  1727. MAXLOG :: 8.8029691931113054295988e+01 // log(2**127)
  1728. x := f64(y)
  1729. z := abs(x)
  1730. switch {
  1731. case z > 0.5*MAXLOG:
  1732. if x < 0 {
  1733. return -1
  1734. }
  1735. return 1
  1736. case z >= 0.625:
  1737. s := exp(2 * z)
  1738. z = 1 - 2/(s+1)
  1739. if x < 0 {
  1740. z = -z
  1741. }
  1742. case:
  1743. if x == 0 {
  1744. return T(x)
  1745. }
  1746. s := x * x
  1747. z = x + x*s*((P0*s+P1)*s+P2)/(((s+Q0)*s+Q1)*s+Q2)
  1748. }
  1749. return T(z)
  1750. }
  1751. @(require_results)
  1752. asinh :: proc "contextless" (y: $T) -> T where intrinsics.type_is_float(T) {
  1753. // The original C code, the long comment, and the constants
  1754. // below are from FreeBSD's /usr/src/lib/msun/src/s_asinh.c
  1755. // and came with this notice.
  1756. //
  1757. // ====================================================
  1758. // Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
  1759. //
  1760. // Developed at SunPro, a Sun Microsystems, Inc. business.
  1761. // Permission to use, copy, modify, and distribute this
  1762. // software is freely granted, provided that this notice
  1763. // is preserved.
  1764. // ====================================================
  1765. LN2 :: 0h3FE62E42FEFA39EF
  1766. NEAR_ZERO :: 1.0 / (1 << 28)
  1767. LARGE :: 1 << 28
  1768. x := f64(y)
  1769. if is_nan(x) || is_inf(x) {
  1770. return T(x)
  1771. }
  1772. sign := false
  1773. if x < 0 {
  1774. x = -x
  1775. sign = true
  1776. }
  1777. temp: f64
  1778. switch {
  1779. case x > LARGE:
  1780. temp = ln(x) + LN2
  1781. case x > 2:
  1782. temp = ln(2*x + 1/(sqrt(x*x + 1) + x))
  1783. case x < NEAR_ZERO:
  1784. temp = x
  1785. case:
  1786. temp = log1p(x + x*x/(1 + sqrt(1 + x*x)))
  1787. }
  1788. if sign {
  1789. temp = -temp
  1790. }
  1791. return T(temp)
  1792. }
  1793. @(require_results)
  1794. acosh :: proc "contextless" (y: $T) -> T where intrinsics.type_is_float(T) {
  1795. // The original C code, the long comment, and the constants
  1796. // below are from FreeBSD's /usr/src/lib/msun/src/e_acosh.c
  1797. // and came with this notice.
  1798. //
  1799. // ====================================================
  1800. // Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
  1801. //
  1802. // Developed at SunPro, a Sun Microsystems, Inc. business.
  1803. // Permission to use, copy, modify, and distribute this
  1804. // software is freely granted, provided that this notice
  1805. // is preserved.
  1806. // ====================================================
  1807. LARGE :: 1<<28
  1808. LN2 :: 0h3FE62E42FEFA39EF
  1809. x := f64(y)
  1810. switch {
  1811. case x < 1 || is_nan(x):
  1812. return T(nan_f64())
  1813. case x == 1:
  1814. return 0
  1815. case x >= LARGE:
  1816. return T(ln(x) + LN2)
  1817. case x > 2:
  1818. return T(ln(2*x - 1/(x+sqrt(x*x-1))))
  1819. }
  1820. t := x-1
  1821. return T(log1p(t + sqrt(2*t + t*t)))
  1822. }
  1823. @(require_results)
  1824. atanh :: proc "contextless" (y: $T) -> T where intrinsics.type_is_float(T) {
  1825. // The original C code, the long comment, and the constants
  1826. // below are from FreeBSD's /usr/src/lib/msun/src/e_atanh.c
  1827. // and came with this notice.
  1828. //
  1829. // ====================================================
  1830. // Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
  1831. //
  1832. // Developed at SunPro, a Sun Microsystems, Inc. business.
  1833. // Permission to use, copy, modify, and distribute this
  1834. // software is freely granted, provided that this notice
  1835. // is preserved.
  1836. // ====================================================
  1837. NEAR_ZERO :: 1.0 / (1 << 28)
  1838. x := f64(y)
  1839. switch {
  1840. case x < -1 || x > 1 || is_nan(x):
  1841. return T(nan_f64())
  1842. case x == 1:
  1843. return T(inf_f64(1))
  1844. case x == -1:
  1845. return T(inf_f64(-1))
  1846. }
  1847. sign := false
  1848. if x < 0 {
  1849. x = -x
  1850. sign = true
  1851. }
  1852. temp: f64
  1853. switch {
  1854. case x < NEAR_ZERO:
  1855. temp = x
  1856. case x < 0.5:
  1857. temp = x + x
  1858. temp = 0.5 * log1p(temp + temp*x/(1-x))
  1859. case:
  1860. temp = 0.5 * log1p((x+x)/(1-x))
  1861. }
  1862. if sign {
  1863. temp = -temp
  1864. }
  1865. return T(temp)
  1866. }
  1867. @(require_results)
  1868. ilogb_f16 :: proc "contextless" (val: f16) -> int {
  1869. switch {
  1870. case val == 0: return int(min(i32))
  1871. case is_nan(val): return int(max(i32))
  1872. case is_inf(val): return int(max(i32))
  1873. }
  1874. x, exp := normalize_f16(val)
  1875. return int(((transmute(u16)x)>>F16_SHIFT)&F16_MASK) - F16_BIAS + exp
  1876. }
  1877. @(require_results)
  1878. ilogb_f32 :: proc "contextless" (val: f32) -> int {
  1879. switch {
  1880. case val == 0: return int(min(i32))
  1881. case is_nan(val): return int(max(i32))
  1882. case is_inf(val): return int(max(i32))
  1883. }
  1884. x, exp := normalize_f32(val)
  1885. return int(((transmute(u32)x)>>F32_SHIFT)&F32_MASK) - F32_BIAS + exp
  1886. }
  1887. @(require_results)
  1888. ilogb_f64 :: proc "contextless" (val: f64) -> int {
  1889. switch {
  1890. case val == 0: return int(min(i32))
  1891. case is_nan(val): return int(max(i32))
  1892. case is_inf(val): return int(max(i32))
  1893. }
  1894. x, exp := normalize_f64(val)
  1895. return int(((transmute(u64)x)>>F64_SHIFT)&F64_MASK) - F64_BIAS + exp
  1896. }
  1897. @(require_results) ilogb_f16le :: proc "contextless" (value: f16le) -> int { return ilogb_f16(f16(value)) }
  1898. @(require_results) ilogb_f16be :: proc "contextless" (value: f16be) -> int { return ilogb_f16(f16(value)) }
  1899. @(require_results) ilogb_f32le :: proc "contextless" (value: f32le) -> int { return ilogb_f32(f32(value)) }
  1900. @(require_results) ilogb_f32be :: proc "contextless" (value: f32be) -> int { return ilogb_f32(f32(value)) }
  1901. @(require_results) ilogb_f64le :: proc "contextless" (value: f64le) -> int { return ilogb_f64(f64(value)) }
  1902. @(require_results) ilogb_f64be :: proc "contextless" (value: f64be) -> int { return ilogb_f64(f64(value)) }
  1903. ilogb :: proc {
  1904. ilogb_f16,
  1905. ilogb_f32,
  1906. ilogb_f64,
  1907. ilogb_f16le,
  1908. ilogb_f16be,
  1909. ilogb_f32le,
  1910. ilogb_f32be,
  1911. ilogb_f64le,
  1912. ilogb_f64be,
  1913. }
  1914. @(require_results)
  1915. logb_f16 :: proc "contextless" (val: f16) -> f16 {
  1916. switch {
  1917. case val == 0: return inf_f16(-1)
  1918. case is_inf(val): return inf_f16(+1)
  1919. case is_nan(val): return val
  1920. }
  1921. return f16(ilogb(val))
  1922. }
  1923. @(require_results)
  1924. logb_f32 :: proc "contextless" (val: f32) -> f32 {
  1925. switch {
  1926. case val == 0: return inf_f32(-1)
  1927. case is_inf(val): return inf_f32(+1)
  1928. case is_nan(val): return val
  1929. }
  1930. return f32(ilogb(val))
  1931. }
  1932. @(require_results)
  1933. logb_f64 :: proc "contextless" (val: f64) -> f64 {
  1934. switch {
  1935. case val == 0: return inf_f64(-1)
  1936. case is_inf(val): return inf_f64(+1)
  1937. case is_nan(val): return val
  1938. }
  1939. return f64(ilogb(val))
  1940. }
  1941. @(require_results) logb_f16le :: proc "contextless" (value: f16le) -> f16le { return f16le(logb_f16(f16(value))) }
  1942. @(require_results) logb_f16be :: proc "contextless" (value: f16be) -> f16be { return f16be(logb_f16(f16(value))) }
  1943. @(require_results) logb_f32le :: proc "contextless" (value: f32le) -> f32le { return f32le(logb_f32(f32(value))) }
  1944. @(require_results) logb_f32be :: proc "contextless" (value: f32be) -> f32be { return f32be(logb_f32(f32(value))) }
  1945. @(require_results) logb_f64le :: proc "contextless" (value: f64le) -> f64le { return f64le(logb_f64(f64(value))) }
  1946. @(require_results) logb_f64be :: proc "contextless" (value: f64be) -> f64be { return f64be(logb_f64(f64(value))) }
  1947. logb :: proc {
  1948. logb_f16,
  1949. logb_f32,
  1950. logb_f64,
  1951. logb_f16le,
  1952. logb_f16be,
  1953. logb_f32le,
  1954. logb_f32be,
  1955. logb_f64le,
  1956. logb_f64be,
  1957. }
  1958. @(require_results)
  1959. nextafter_f16 :: proc "contextless" (x, y: f16) -> (r: f16) {
  1960. switch {
  1961. case is_nan(x) || is_nan(y):
  1962. r = nan_f16()
  1963. case x == y:
  1964. r = x
  1965. case x == 0:
  1966. r = copy_sign_f16(1, y)
  1967. case (y > x) == (x > 0):
  1968. r = transmute(f16)(transmute(u16)x + 1)
  1969. case:
  1970. r = transmute(f16)(transmute(u16)x - 1)
  1971. }
  1972. return
  1973. }
  1974. @(require_results)
  1975. nextafter_f32 :: proc "contextless" (x, y: f32) -> (r: f32) {
  1976. switch {
  1977. case is_nan(x) || is_nan(y):
  1978. r = nan_f32()
  1979. case x == y:
  1980. r = x
  1981. case x == 0:
  1982. r = copy_sign_f32(1, y)
  1983. case (y > x) == (x > 0):
  1984. r = transmute(f32)(transmute(u32)x + 1)
  1985. case:
  1986. r = transmute(f32)(transmute(u32)x - 1)
  1987. }
  1988. return
  1989. }
  1990. @(require_results)
  1991. nextafter_f64 :: proc "contextless" (x, y: f64) -> (r: f64) {
  1992. switch {
  1993. case is_nan(x) || is_nan(y):
  1994. r = nan_f64()
  1995. case x == y:
  1996. r = x
  1997. case x == 0:
  1998. r = copy_sign_f64(1, y)
  1999. case (y > x) == (x > 0):
  2000. r = transmute(f64)(transmute(u64)x + 1)
  2001. case:
  2002. r = transmute(f64)(transmute(u64)x - 1)
  2003. }
  2004. return
  2005. }
  2006. @(require_results) nextafter_f16le :: proc "contextless" (x, y: f16le) -> (r: f16le) { return f16le(nextafter_f16(f16(x), f16(y))) }
  2007. @(require_results) nextafter_f16be :: proc "contextless" (x, y: f16be) -> (r: f16be) { return f16be(nextafter_f16(f16(x), f16(y))) }
  2008. @(require_results) nextafter_f32le :: proc "contextless" (x, y: f32le) -> (r: f32le) { return f32le(nextafter_f32(f32(x), f32(y))) }
  2009. @(require_results) nextafter_f32be :: proc "contextless" (x, y: f32be) -> (r: f32be) { return f32be(nextafter_f32(f32(x), f32(y))) }
  2010. @(require_results) nextafter_f64le :: proc "contextless" (x, y: f64le) -> (r: f64le) { return f64le(nextafter_f64(f64(x), f64(y))) }
  2011. @(require_results) nextafter_f64be :: proc "contextless" (x, y: f64be) -> (r: f64be) { return f64be(nextafter_f64(f64(x), f64(y))) }
  2012. nextafter :: proc{
  2013. nextafter_f16, nextafter_f16le, nextafter_f16be,
  2014. nextafter_f32, nextafter_f32le, nextafter_f32be,
  2015. nextafter_f64, nextafter_f64le, nextafter_f64be,
  2016. }
  2017. @(require_results)
  2018. signbit_f16 :: proc "contextless" (x: f16) -> bool {
  2019. return (transmute(u16)x)&(1<<15) != 0
  2020. }
  2021. @(require_results)
  2022. signbit_f32 :: proc "contextless" (x: f32) -> bool {
  2023. return (transmute(u32)x)&(1<<31) != 0
  2024. }
  2025. @(require_results)
  2026. signbit_f64 :: proc "contextless" (x: f64) -> bool {
  2027. return (transmute(u64)x)&(1<<63) != 0
  2028. }
  2029. @(require_results) signbit_f16le :: proc "contextless" (x: f16le) -> bool { return signbit_f16(f16(x)) }
  2030. @(require_results) signbit_f32le :: proc "contextless" (x: f32le) -> bool { return signbit_f32(f32(x)) }
  2031. @(require_results) signbit_f64le :: proc "contextless" (x: f64le) -> bool { return signbit_f64(f64(x)) }
  2032. @(require_results) signbit_f16be :: proc "contextless" (x: f16be) -> bool { return signbit_f16(f16(x)) }
  2033. @(require_results) signbit_f32be :: proc "contextless" (x: f32be) -> bool { return signbit_f32(f32(x)) }
  2034. @(require_results) signbit_f64be :: proc "contextless" (x: f64be) -> bool { return signbit_f64(f64(x)) }
  2035. signbit :: proc{
  2036. signbit_f16, signbit_f16le, signbit_f16be,
  2037. signbit_f32, signbit_f32le, signbit_f32be,
  2038. signbit_f64, signbit_f64le, signbit_f64be,
  2039. }
  2040. @(require_results)
  2041. hypot_f16 :: proc "contextless" (x, y: f16) -> (r: f16) {
  2042. p, q := abs(x), abs(y)
  2043. switch {
  2044. case is_inf(p, 1) || is_inf(q, 1):
  2045. return inf_f16(1)
  2046. case is_nan(p) || is_nan(q):
  2047. return nan_f16()
  2048. }
  2049. if p < q {
  2050. p, q = q, p
  2051. }
  2052. if p == 0 {
  2053. return 0
  2054. }
  2055. q = q / p
  2056. return p * sqrt(1+q*q)
  2057. }
  2058. @(require_results)
  2059. hypot_f32 :: proc "contextless" (x, y: f32) -> (r: f32) {
  2060. p, q := abs(x), abs(y)
  2061. switch {
  2062. case is_inf(p, 1) || is_inf(q, 1):
  2063. return inf_f32(1)
  2064. case is_nan(p) || is_nan(q):
  2065. return nan_f32()
  2066. }
  2067. if p < q {
  2068. p, q = q, p
  2069. }
  2070. if p == 0 {
  2071. return 0
  2072. }
  2073. q = q / p
  2074. return p * sqrt(1+q*q)
  2075. }
  2076. @(require_results)
  2077. hypot_f64 :: proc "contextless" (x, y: f64) -> (r: f64) {
  2078. p, q := abs(x), abs(y)
  2079. switch {
  2080. case is_inf(p, 1) || is_inf(q, 1):
  2081. return inf_f64(1)
  2082. case is_nan(p) || is_nan(q):
  2083. return nan_f64()
  2084. }
  2085. if p < q {
  2086. p, q = q, p
  2087. }
  2088. if p == 0 {
  2089. return 0
  2090. }
  2091. q = q / p
  2092. return p * sqrt(1+q*q)
  2093. }
  2094. @(require_results) hypot_f16le :: proc "contextless" (x, y: f16le) -> (r: f16le) { return f16le(hypot_f16(f16(x), f16(y))) }
  2095. @(require_results) hypot_f16be :: proc "contextless" (x, y: f16be) -> (r: f16be) { return f16be(hypot_f16(f16(x), f16(y))) }
  2096. @(require_results) hypot_f32le :: proc "contextless" (x, y: f32le) -> (r: f32le) { return f32le(hypot_f32(f32(x), f32(y))) }
  2097. @(require_results) hypot_f32be :: proc "contextless" (x, y: f32be) -> (r: f32be) { return f32be(hypot_f32(f32(x), f32(y))) }
  2098. @(require_results) hypot_f64le :: proc "contextless" (x, y: f64le) -> (r: f64le) { return f64le(hypot_f64(f64(x), f64(y))) }
  2099. @(require_results) hypot_f64be :: proc "contextless" (x, y: f64be) -> (r: f64be) { return f64be(hypot_f64(f64(x), f64(y))) }
  2100. // hypot returns Sqrt(p*p + q*q), taking care to avoid unnecessary overflow and underflow.
  2101. //
  2102. // Special cases:
  2103. // hypot(±Inf, q) = +Inf
  2104. // hypot(p, ±Inf) = +Inf
  2105. // hypot(NaN, q) = NaN
  2106. // hypot(p, NaN) = NaN
  2107. hypot :: proc{
  2108. hypot_f16, hypot_f16le, hypot_f16be,
  2109. hypot_f32, hypot_f32le, hypot_f32be,
  2110. hypot_f64, hypot_f64le, hypot_f64be,
  2111. }
  2112. F16_DIG :: 3 // f16 analog of F64_DIG: number of representable decimal digits.
  2113. F16_EPSILON :: 0.00097656 // f16 analog of F64_EPSILON. NOTE(review): looks like 2**-10 (0.0009765625) truncated to five significant digits - confirm whether the exact value was intended.
  2114. F16_GUARD :: 0 // NOTE(review): has no F64 counterpart and is not referenced in the visible part of the file; meaning unconfirmed.
  2115. F16_MANT_DIG :: 11 // f16 analog of F64_MANT_DIG: number of bits in the mantissa.
  2116. F16_MAX :: 65504.0 // f16 analog of F64_MAX: maximum representable value.
  2117. F16_MAX_10_EXP :: 4 // f16 analog of F64_MAX_10_EXP: maximum base-10 exponent yielding a normalized value.
  2118. F16_MAX_EXP :: 15 // f16 analog of F64_MAX_EXP. NOTE(review): F32/F64 use "one greater than the maximum base-2 exponent" (128, 1024), which would give 16 here - confirm.
  2119. F16_MIN :: 6.10351562e-5 // f16 analog of F64_MIN: minimum positive normalized value. NOTE(review): looks like 2**-14 (6.103515625e-5) truncated - confirm.
  2120. F16_MIN_10_EXP :: -4 // f16 analog of F64_MIN_10_EXP: minimum base-10 exponent yielding a normalized value.
  2121. F16_MIN_EXP :: -14 // f16 analog of F64_MIN_EXP. NOTE(review): F32/F64 use "one greater than the minimum base-2 exponent" (-125, -1021), which would give -13 here - confirm.
  2122. F16_NORMALIZE :: 0 // NOTE(review): has no F64 counterpart and is not referenced in the visible part of the file; meaning unconfirmed.
  2123. F16_RADIX :: 2 // f16 analog of F64_RADIX: exponent radix.
  2124. F16_ROUNDS :: 1 // f16 analog of F64_ROUNDS: addition rounding, near.
  2125. F32_DIG :: 6 // f32 analog of F64_DIG: number of representable decimal digits.
  2126. F32_EPSILON :: 1.192092896e-07 // f32 analog of F64_EPSILON: smallest number such that `1.0 + F32_EPSILON != 1.0`.
  2127. F32_GUARD :: 0 // NOTE(review): has no F64 counterpart and is not referenced in the visible part of the file; meaning unconfirmed.
  2128. F32_MANT_DIG :: 24 // f32 analog of F64_MANT_DIG: number of bits in the mantissa.
  2129. F32_MAX :: 3.402823466e+38 // f32 analog of F64_MAX: maximum representable value.
  2130. F32_MAX_10_EXP :: 38 // f32 analog of F64_MAX_10_EXP: maximum base-10 exponent yielding a normalized value.
  2131. F32_MAX_EXP :: 128 // f32 analog of F64_MAX_EXP: one greater than the maximum base-2 exponent yielding a normalized value.
  2132. F32_MIN :: 1.175494351e-38 // f32 analog of F64_MIN: minimum positive normalized value.
  2133. F32_MIN_10_EXP :: -37 // f32 analog of F64_MIN_10_EXP: minimum base-10 exponent yielding a normalized value.
  2134. F32_MIN_EXP :: -125 // f32 analog of F64_MIN_EXP: one greater than the minimum base-2 exponent yielding a normalized value.
  2135. F32_NORMALIZE :: 0 // NOTE(review): has no F64 counterpart and is not referenced in the visible part of the file; meaning unconfirmed.
  2136. F32_RADIX :: 2 // f32 analog of F64_RADIX: exponent radix.
  2137. F32_ROUNDS :: 1 // f32 analog of F64_ROUNDS: addition rounding, near.
  2138. F64_DIG :: 15 // Number of representable decimal digits.
  2139. F64_EPSILON :: 2.2204460492503131e-016 // Smallest number such that `1.0 + F64_EPSILON != 1.0`.
  2140. F64_MANT_DIG :: 53 // Number of bits in the mantissa.
  2141. F64_MAX :: 1.7976931348623158e+308 // Maximum representable value.
  2142. F64_MAX_10_EXP :: 308 // Maximum base-10 exponent yielding a normalized value.
  2143. F64_MAX_EXP :: 1024 // One greater than the maximum possible base-2 exponent yielding a normalized value.
  2144. F64_MIN :: 2.2250738585072014e-308 // Minimum positive normalized value.
  2145. F64_MIN_10_EXP :: -307 // Minimum base-10 exponent yielding a normalized value.
  2146. F64_MIN_EXP :: -1021 // One greater than the minimum possible base-2 exponent yielding a normalized value.
  2147. F64_RADIX :: 2 // Exponent radix.
  2148. F64_ROUNDS :: 1 // Addition rounding mode: 1 means round to nearest.
  2149. F16_MASK :: 0x1f // Mask applied to the shifted f16 bit pattern to isolate the exponent field (5 bits); used by ilogb_f16.
  2150. F16_SHIFT :: 16 - 6 // Right shift (10) that brings the f16 exponent field down to bit 0.
  2151. F16_BIAS :: 0xf // Value subtracted from the extracted f16 exponent field to unbias it (15).
  2152. F32_MASK :: 0xff // Mask applied to the shifted f32 bit pattern to isolate the exponent field (8 bits); used by ilogb_f32.
  2153. F32_SHIFT :: 32 - 9 // Right shift (23) that brings the f32 exponent field down to bit 0.
  2154. F32_BIAS :: 0x7f // Value subtracted from the extracted f32 exponent field to unbias it (127).
  2155. F64_MASK :: 0x7ff // Mask applied to the shifted f64 bit pattern to isolate the exponent field (11 bits); used by ilogb_f64.
  2156. F64_SHIFT :: 64 - 12 // Right shift (52) that brings the f64 exponent field down to bit 0.
  2157. F64_BIAS :: 0x3ff // Value subtracted from the extracted f64 exponent field to unbias it (1023).
  2158. INF_F16 :: f16(0h7C00) // Positive infinity as f16.
  2159. NEG_INF_F16 :: f16(0hFC00) // Negative infinity as f16 (INF_F16 with the top bit set).
  2160. SNAN_F16 :: f16(0h7C01) // Presumably a signaling NaN (per the name): INF_F16 pattern with the lowest mantissa bit set.
  2161. QNAN_F16 :: f16(0h7E01) // Presumably a quiet NaN (per the name): SNAN_F16 pattern with the top mantissa bit also set.
  2162. INF_F32 :: f32(0h7F80_0000) // Positive infinity as f32.
  2163. NEG_INF_F32 :: f32(0hFF80_0000) // Negative infinity as f32 (INF_F32 with the top bit set).
  2164. SNAN_F32 :: f32(0hFF80_0001) // NOTE(review): unlike SNAN_F16/SNAN_F64 this pattern has the sign bit set (0hFF80... rather than 0h7F80...) - confirm whether intentional.
  2165. QNAN_F32 :: f32(0hFFC0_0001) // NOTE(review): unlike QNAN_F16/QNAN_F64 this pattern has the sign bit set (0hFFC0... rather than 0h7FC0...) - confirm whether intentional.
  2166. INF_F64 :: f64(0h7FF0_0000_0000_0000) // Positive infinity as f64; same pattern inf_f64 returns for sign >= 0.
  2167. NEG_INF_F64 :: f64(0hFFF0_0000_0000_0000) // Negative infinity as f64; same pattern inf_f64 returns for sign < 0.
  2168. SNAN_F64 :: f64(0h7FF0_0000_0000_0001) // Presumably a signaling NaN (per the name): INF_F64 pattern with the lowest mantissa bit set.
  2169. QNAN_F64 :: f64(0h7FF8_0000_0000_0001) // Same bit pattern that nan_f64 returns.