gtx_simd_mat4.cpp 7.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304
  1. ///////////////////////////////////////////////////////////////////////////////////////////////////
  2. // OpenGL Mathematics Copyright (c) 2005 - 2013 G-Truc Creation (www.g-truc.net)
  3. ///////////////////////////////////////////////////////////////////////////////////////////////////
  4. // Created : 2010-09-16
  5. // Updated : 2010-09-16
  6. // Licence : This source is under MIT licence
  7. // File : test/gtx/simd-mat4.cpp
  8. ///////////////////////////////////////////////////////////////////////////////////////////////////
  9. #include <glm/glm.hpp>
  10. #include <glm/gtc/matrix_transform.hpp>
  11. #include <glm/gtc/quaternion.hpp>
  12. #include <glm/gtc/random.hpp>
  13. #include <glm/gtx/simd_vec4.hpp>
  14. #include <glm/gtx/simd_mat4.hpp>
  15. #include <iostream>
  16. #include <cstdio>
  17. #include <ctime>
  18. #include <vector>
  19. #if(GLM_ARCH != GLM_ARCH_PURE)
  20. std::vector<float> test_detA(std::vector<glm::mat4> const & Data)
  21. {
  22. std::vector<float> Test(Data.size());
  23. std::clock_t TimeStart = clock();
  24. for(std::size_t i = 0; i < Test.size() - 1; ++i)
  25. Test[i] = glm::determinant(Data[i]);
  26. std::clock_t TimeEnd = clock();
  27. printf("Det A: %ld\n", TimeEnd - TimeStart);
  28. return Test;
  29. }
  30. std::vector<float> test_detB(std::vector<glm::mat4> const & Data)
  31. {
  32. std::vector<float> Test(Data.size());
  33. std::clock_t TimeStart = clock();
  34. for(std::size_t i = 0; i < Test.size() - 1; ++i)
  35. {
  36. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  37. glm::simdMat4 m(Data[i]);
  38. glm::simdVec4 d(glm::detail::sse_slow_det_ps((__m128 const * const)&m));
  39. glm::vec4 v;//(d);
  40. Test[i] = v.x;
  41. }
  42. std::clock_t TimeEnd = clock();
  43. printf("Det B: %ld\n", TimeEnd - TimeStart);
  44. return Test;
  45. }
  46. std::vector<float> test_detC(std::vector<glm::mat4> const & Data)
  47. {
  48. std::vector<float> Test(Data.size());
  49. std::clock_t TimeStart = clock();
  50. for(std::size_t i = 0; i < Test.size() - 1; ++i)
  51. {
  52. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  53. glm::simdMat4 m(Data[i]);
  54. glm::simdVec4 d(glm::detail::sse_det_ps((__m128 const * const)&m));
  55. glm::vec4 v;//(d);
  56. Test[i] = v.x;
  57. }
  58. std::clock_t TimeEnd = clock();
  59. printf("Det C: %ld\n", TimeEnd - TimeStart);
  60. return Test;
  61. }
  62. std::vector<float> test_detD(std::vector<glm::mat4> const & Data)
  63. {
  64. std::vector<float> Test(Data.size());
  65. std::clock_t TimeStart = clock();
  66. for(std::size_t i = 0; i < Test.size() - 1; ++i)
  67. {
  68. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  69. glm::simdMat4 m(Data[i]);
  70. glm::simdVec4 d(glm::detail::sse_detd_ps((__m128 const * const)&m));
  71. glm::vec4 v;//(d);
  72. Test[i] = v.x;
  73. }
  74. std::clock_t TimeEnd = clock();
  75. printf("Det D: %ld\n", TimeEnd - TimeStart);
  76. return Test;
  77. }
  78. void test_invA(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  79. {
  80. //std::vector<float> Test(Data.size());
  81. Out.resize(Data.size());
  82. std::clock_t TimeStart = clock();
  83. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  84. {
  85. Out[i] = glm::inverse(Data[i]);
  86. }
  87. std::clock_t TimeEnd = clock();
  88. printf("Inv A: %ld\n", TimeEnd - TimeStart);
  89. }
  90. void test_invC(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  91. {
  92. //std::vector<float> Test(Data.size());
  93. Out.resize(Data.size());
  94. std::clock_t TimeStart = clock();
  95. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  96. {
  97. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  98. glm::simdMat4 m(Data[i]);
  99. glm::simdMat4 o;
  100. glm::detail::sse_inverse_fast_ps((__m128 const * const)&m, (__m128 *)&o);
  101. Out[i] = *(glm::mat4*)&o;
  102. }
  103. std::clock_t TimeEnd = clock();
  104. printf("Inv C: %ld\n", TimeEnd - TimeStart);
  105. }
  106. void test_invD(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  107. {
  108. //std::vector<float> Test(Data.size());
  109. Out.resize(Data.size());
  110. std::clock_t TimeStart = clock();
  111. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  112. {
  113. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  114. glm::simdMat4 m(Data[i]);
  115. glm::simdMat4 o;
  116. glm::detail::sse_inverse_ps((__m128 const * const)&m, (__m128 *)&o);
  117. Out[i] = *(glm::mat4*)&o;
  118. }
  119. std::clock_t TimeEnd = clock();
  120. printf("Inv D: %ld\n", TimeEnd - TimeStart);
  121. }
  122. void test_mulA(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  123. {
  124. //std::vector<float> Test(Data.size());
  125. Out.resize(Data.size());
  126. std::clock_t TimeStart = clock();
  127. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  128. {
  129. Out[i] = Data[i] * Data[i];
  130. }
  131. std::clock_t TimeEnd = clock();
  132. printf("Mul A: %ld\n", TimeEnd - TimeStart);
  133. }
  134. void test_mulD(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  135. {
  136. //std::vector<float> Test(Data.size());
  137. Out.resize(Data.size());
  138. std::clock_t TimeStart = clock();
  139. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  140. {
  141. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  142. glm::simdMat4 m(Data[i]);
  143. glm::simdMat4 o;
  144. glm::detail::sse_mul_ps((__m128 const * const)&m, (__m128 const * const)&m, (__m128*)&o);
  145. Out[i] = *(glm::mat4*)&o;
  146. }
  147. std::clock_t TimeEnd = clock();
  148. printf("Mul D: %ld\n", TimeEnd - TimeStart);
  149. }
  150. int test_compute_glm()
  151. {
  152. return 0;
  153. }
  154. int test_compute_gtx()
  155. {
  156. std::vector<glm::vec4> Output(1000000);
  157. std::clock_t TimeStart = clock();
  158. for(std::size_t k = 0; k < Output.size(); ++k)
  159. {
  160. float i = float(k) / 1000.f + 0.001f;
  161. glm::vec3 A = glm::normalize(glm::vec3(i));
  162. glm::vec3 B = glm::cross(A, glm::normalize(glm::vec3(1, 1, 2)));
  163. glm::mat4 C = glm::rotate(glm::mat4(1.0f), i, B);
  164. glm::mat4 D = glm::scale(C, glm::vec3(0.8f, 1.0f, 1.2f));
  165. glm::mat4 E = glm::translate(D, glm::vec3(1.4f, 1.2f, 1.1f));
  166. glm::mat4 F = glm::perspective(i, 1.5f, 0.1f, 1000.f);
  167. glm::mat4 G = glm::inverse(F * E);
  168. glm::vec3 H = glm::unProject(glm::vec3(i), G, F, E[3]);
  169. glm::vec3 I = glm::any(glm::isnan(glm::project(H, G, F, E[3]))) ? glm::vec3(2) : glm::vec3(1);
  170. glm::mat4 J = glm::lookAt(glm::normalize(glm::max(B, glm::vec3(0.001f))), H, I);
  171. glm::mat4 K = glm::transpose(J);
  172. glm::quat L = glm::normalize(glm::quat_cast(K));
  173. glm::vec4 M = L * glm::smoothstep(K[3], J[3], glm::vec4(i));
  174. glm::mat4 N = glm::mat4(glm::normalize(glm::max(M, glm::vec4(0.001f))), K[3], J[3], glm::vec4(i));
  175. glm::mat4 O = N * glm::inverse(N);
  176. glm::vec4 P = O * glm::reflect(N[3], glm::vec4(A, 1.0f));
  177. glm::vec4 Q = glm::vec4(glm::dot(M, P));
  178. glm::vec4 R = glm::quat(Q.w, glm::vec3(Q)) * P;
  179. Output[k] = R;
  180. }
  181. std::clock_t TimeEnd = clock();
  182. printf("test_compute_gtx: %ld\n", TimeEnd - TimeStart);
  183. return 0;
  184. }
  185. int main()
  186. {
  187. int Error = 0;
  188. std::vector<glm::mat4> Data(64 * 64 * 1);
  189. for(std::size_t i = 0; i < Data.size(); ++i)
  190. Data[i] = glm::mat4(
  191. glm::vec4(glm::linearRand(glm::vec4(-2.0f), glm::vec4(2.0f))),
  192. glm::vec4(glm::linearRand(glm::vec4(-2.0f), glm::vec4(2.0f))),
  193. glm::vec4(glm::linearRand(glm::vec4(-2.0f), glm::vec4(2.0f))),
  194. glm::vec4(glm::linearRand(glm::vec4(-2.0f), glm::vec4(2.0f))));
  195. {
  196. std::vector<glm::mat4> TestInvA;
  197. test_invA(Data, TestInvA);
  198. }
  199. {
  200. std::vector<glm::mat4> TestInvC;
  201. test_invC(Data, TestInvC);
  202. }
  203. {
  204. std::vector<glm::mat4> TestInvD;
  205. test_invD(Data, TestInvD);
  206. }
  207. {
  208. std::vector<glm::mat4> TestA;
  209. test_mulA(Data, TestA);
  210. }
  211. {
  212. std::vector<glm::mat4> TestD;
  213. test_mulD(Data, TestD);
  214. }
  215. {
  216. std::vector<float> TestDetA = test_detA(Data);
  217. std::vector<float> TestDetB = test_detB(Data);
  218. std::vector<float> TestDetD = test_detD(Data);
  219. std::vector<float> TestDetC = test_detC(Data);
  220. for(std::size_t i = 0; i < TestDetA.size(); ++i)
  221. if(TestDetA[i] != TestDetB[i] && TestDetC[i] != TestDetB[i] && TestDetC[i] != TestDetD[i])
  222. return 1;
  223. }
  224. // shuffle test
  225. glm::simdVec4 A(1.0f, 2.0f, 3.0f, 4.0f);
  226. glm::simdVec4 B(5.0f, 6.0f, 7.0f, 8.0f);
  227. //__m128 C = _mm_shuffle_ps(A.Data, B.Data, _MM_SHUFFLE(1, 0, 1, 0));
  228. Error += test_compute_glm();
  229. Error += test_compute_gtx();
  230. float Det = glm::determinant(glm::simdMat4(1.0));
  231. Error += Det == 1.0f ? 0 : 1;
  232. glm::simdMat4 D = glm::matrixCompMult(glm::simdMat4(1.0), glm::simdMat4(1.0));
  233. return Error;
  234. }
  235. #else
  236. int main()
  237. {
  238. int Error = 0;
  239. return Error;
  240. }
  241. #endif//(GLM_ARCH != GLM_ARCH_PURE)