a00045_source.html 7.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144
  1. <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
  2. <html xmlns="http://www.w3.org/1999/xhtml">
  3. <head>
  4. <meta http-equiv="Content-Type" content="text/html;charset=UTF-8"/>
  5. <title>intrinsic_exponential.hpp Source File</title>
  6. <link href="tabs.css" rel="stylesheet" type="text/css"/>
  7. <link href="doxygen.css" rel="stylesheet" type="text/css" />
  8. </head>
  9. <body>
  10. <div id="top"><!-- do not remove this div! -->
  11. <div id="titlearea">
  12. <table cellspacing="0" cellpadding="0">
  13. <tbody>
  14. <tr style="height: 56px;">
  15. <td id="projectlogo"><img alt="Logo" src="logo-mini.png"/></td>
  16. </tr>
  17. </tbody>
  18. </table>
  19. </div>
  20. <!-- Generated by Doxygen 1.7.5.1 -->
  21. <div id="navrow1" class="tabs">
  22. <ul class="tablist">
  23. <li><a href="index.html"><span>Main&#160;Page</span></a></li>
  24. <li><a href="pages.html"><span>Related&#160;Pages</span></a></li>
  25. <li><a href="modules.html"><span>Modules</span></a></li>
  26. <li><a href="annotated.html"><span>Classes</span></a></li>
  27. <li class="current"><a href="files.html"><span>Files</span></a></li>
  28. </ul>
  29. </div>
  30. <div id="navrow2" class="tabs2">
  31. <ul class="tablist">
  32. <li><a href="files.html"><span>File&#160;List</span></a></li>
  33. </ul>
  34. </div>
  35. <div class="header">
  36. <div class="headertitle">
  37. <div class="title">intrinsic_exponential.hpp</div> </div>
  38. </div>
  39. <div class="contents">
  40. <a href="a00045.html">Go to the documentation of this file.</a><div class="fragment"><pre class="fragment"><a name="l00001"></a>00001
  41. <a name="l00002"></a>00002
  42. <a name="l00003"></a>00003
  43. <a name="l00004"></a>00004
  44. <a name="l00005"></a>00005
  45. <a name="l00006"></a>00006
  46. <a name="l00007"></a>00007
  47. <a name="l00008"></a>00008
  48. <a name="l00009"></a>00009
  49. <a name="l00010"></a>00010
  50. <a name="l00011"></a>00011
  51. <a name="l00012"></a>00012
  52. <a name="l00013"></a>00013
  53. <a name="l00014"></a>00014
  54. <a name="l00015"></a>00015
  55. <a name="l00016"></a>00016
  56. <a name="l00017"></a>00017
  57. <a name="l00018"></a>00018
  58. <a name="l00019"></a>00019
  59. <a name="l00020"></a>00020
  60. <a name="l00021"></a>00021
  61. <a name="l00022"></a>00022
  62. <a name="l00023"></a>00023
  63. <a name="l00024"></a>00024
  64. <a name="l00025"></a>00025
  65. <a name="l00026"></a>00026
  66. <a name="l00027"></a>00027
  67. <a name="l00028"></a>00028
  68. <a name="l00029"></a>00029 <span class="preprocessor">#ifndef glm_detail_intrinsic_exponential</span>
  69. <a name="l00030"></a>00030 <span class="preprocessor"></span><span class="preprocessor">#define glm_detail_intrinsic_exponential</span>
  70. <a name="l00031"></a>00031 <span class="preprocessor"></span>
  71. <a name="l00032"></a>00032 <span class="preprocessor">#include &quot;<a class="code" href="a00083.html" title="OpenGL Mathematics (glm.g-truc.net)">setup.hpp</a>&quot;</span>
  72. <a name="l00033"></a>00033
  73. <a name="l00034"></a>00034 <span class="preprocessor">#if((GLM_ARCH &amp; GLM_ARCH_SSE2) != GLM_ARCH_SSE2)</span>
  74. <a name="l00035"></a>00035 <span class="preprocessor"></span><span class="preprocessor"># error &quot;SSE2 instructions not supported or enabled&quot;</span>
  75. <a name="l00036"></a>00036 <span class="preprocessor"></span><span class="preprocessor">#else</span>
  76. <a name="l00037"></a>00037 <span class="preprocessor"></span>
  77. <a name="l00038"></a>00038 <span class="keyword">namespace </span>glm{
  78. <a name="l00039"></a>00039 <span class="keyword">namespace </span>detail
  79. <a name="l00040"></a>00040 {
  80. <a name="l00041"></a>00041 <span class="comment">/*</span>
  81. <a name="l00042"></a>00042 <span class="comment">GLM_FUNC_QUALIFIER __m128 sse_rsqrt_nr_ss(__m128 const x)</span>
  82. <a name="l00043"></a>00043 <span class="comment">{</span>
  83. <a name="l00044"></a>00044 <span class="comment"> __m128 recip = _mm_rsqrt_ss( x ); // &quot;estimate&quot; opcode</span>
  84. <a name="l00045"></a>00045 <span class="comment"> const static __m128 three = { 3, 3, 3, 3 }; // aligned consts for fast load</span>
  85. <a name="l00046"></a>00046 <span class="comment"> const static __m128 half = { 0.5,0.5,0.5,0.5 };</span>
  86. <a name="l00047"></a>00047 <span class="comment"> __m128 halfrecip = _mm_mul_ss( half, recip );</span>
  87. <a name="l00048"></a>00048 <span class="comment"> __m128 threeminus_xrr = _mm_sub_ss( three, _mm_mul_ss( x, _mm_mul_ss ( recip, recip ) ) );</span>
  88. <a name="l00049"></a>00049 <span class="comment"> return _mm_mul_ss( halfrecip, threeminus_xrr );</span>
  89. <a name="l00050"></a>00050 <span class="comment">}</span>
  90. <a name="l00051"></a>00051 <span class="comment"> </span>
  91. <a name="l00052"></a>00052 <span class="comment">GLM_FUNC_QUALIFIER __m128 sse_normalize_fast_ps( float * RESTRICT vOut, float * RESTRICT vIn )</span>
  92. <a name="l00053"></a>00053 <span class="comment">{</span>
  93. <a name="l00054"></a>00054 <span class="comment"> __m128 x = _mm_load_ss(&amp;vIn[0]);</span>
  94. <a name="l00055"></a>00055 <span class="comment"> __m128 y = _mm_load_ss(&amp;vIn[1]);</span>
  95. <a name="l00056"></a>00056 <span class="comment"> __m128 z = _mm_load_ss(&amp;vIn[2]);</span>
  96. <a name="l00057"></a>00057 <span class="comment"> </span>
  97. <a name="l00058"></a>00058 <span class="comment"> const __m128 l = // compute x*x + y*y + z*z</span>
  98. <a name="l00059"></a>00059 <span class="comment"> _mm_add_ss(</span>
  99. <a name="l00060"></a>00060 <span class="comment"> _mm_add_ss( _mm_mul_ss(x,x),</span>
  100. <a name="l00061"></a>00061 <span class="comment"> _mm_mul_ss(y,y)</span>
  101. <a name="l00062"></a>00062 <span class="comment"> ),</span>
  102. <a name="l00063"></a>00063 <span class="comment"> _mm_mul_ss( z, z )</span>
  103. <a name="l00064"></a>00064 <span class="comment"> );</span>
  104. <a name="l00065"></a>00065 <span class="comment"> </span>
  105. <a name="l00066"></a>00066 <span class="comment"> </span>
  106. <a name="l00067"></a>00067 <span class="comment"> const __m128 rsqt = sse_rsqrt_nr_ss( l );</span>
  107. <a name="l00068"></a>00068 <span class="comment"> _mm_store_ss( &amp;vOut[0] , _mm_mul_ss( rsqt, x ) );</span>
  108. <a name="l00069"></a>00069 <span class="comment"> _mm_store_ss( &amp;vOut[1] , _mm_mul_ss( rsqt, y ) );</span>
  109. <a name="l00070"></a>00070 <span class="comment"> _mm_store_ss( &amp;vOut[2] , _mm_mul_ss( rsqt, z ) );</span>
  110. <a name="l00071"></a>00071 <span class="comment"> </span>
  111. <a name="l00072"></a>00072 <span class="comment"> return _mm_mul_ss( l , rsqt );</span>
  112. <a name="l00073"></a>00073 <span class="comment">}</span>
  113. <a name="l00074"></a>00074 <span class="comment">*/</span>
  114. <a name="l00075"></a>00075 }<span class="comment">//namespace detail</span>
  115. <a name="l00076"></a>00076 }<span class="comment">//namespace glm</span>
  116. <a name="l00077"></a>00077
  117. <a name="l00078"></a>00078 <span class="preprocessor">#endif//GLM_ARCH</span>
  118. <a name="l00079"></a>00079 <span class="preprocessor"></span><span class="preprocessor">#endif//glm_detail_intrinsic_exponential</span>
  119. </pre></div></div>
  120. </div>
  121. <hr class="footer"/><address class="footer"><small>
  122. Generated by &#160;<a href="http://www.doxygen.org/index.html">
  123. <img class="footer" src="doxygen.png" alt="doxygen"/>
  124. </a> 1.7.5.1
  125. </small></address>
  126. </body>
  127. </html>