gtx-simd-mat4.cpp 7.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289
  1. ///////////////////////////////////////////////////////////////////////////////////////////////////
  2. // OpenGL Mathematics Copyright (c) 2005 - 2011 G-Truc Creation (www.g-truc.net)
  3. ///////////////////////////////////////////////////////////////////////////////////////////////////
  4. // Created : 2010-09-16
  5. // Updated : 2010-09-16
  6. // Licence : This source is under MIT licence
  7. // File : test/gtx/simd-mat4.cpp
  8. ///////////////////////////////////////////////////////////////////////////////////////////////////
  9. #include <glm/glm.hpp>
  10. #include <glm/gtc/matrix_transform.hpp>
  11. #include <glm/gtc/quaternion.hpp>
  12. #include <glm/gtx/simd_vec4.hpp>
  13. #include <glm/gtx/simd_mat4.hpp>
  14. #include <glm/gtx/random.hpp>
  15. #include <iostream>
  16. #include <cstdio>
  17. #include <ctime>
  18. #include <vector>
  19. std::vector<float> test_detA(std::vector<glm::mat4> const & Data)
  20. {
  21. std::vector<float> Test(Data.size());
  22. std::clock_t TimeStart = clock();
  23. for(std::size_t i = 0; i < Test.size() - 1; ++i)
  24. Test[i] = glm::determinant(Data[i]);
  25. std::clock_t TimeEnd = clock();
  26. printf("Det A: %ld\n", TimeEnd - TimeStart);
  27. return Test;
  28. }
  29. std::vector<float> test_detB(std::vector<glm::mat4> const & Data)
  30. {
  31. std::vector<float> Test(Data.size());
  32. std::clock_t TimeStart = clock();
  33. for(std::size_t i = 0; i < Test.size() - 1; ++i)
  34. {
  35. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  36. glm::simdMat4 m(Data[i]);
  37. glm::simdVec4 d(glm::detail::sse_slow_det_ps((__m128 const * const)&m));
  38. glm::vec4 v;//(d);
  39. Test[i] = v.x;
  40. }
  41. std::clock_t TimeEnd = clock();
  42. printf("Det B: %ld\n", TimeEnd - TimeStart);
  43. return Test;
  44. }
  45. std::vector<float> test_detC(std::vector<glm::mat4> const & Data)
  46. {
  47. std::vector<float> Test(Data.size());
  48. std::clock_t TimeStart = clock();
  49. for(std::size_t i = 0; i < Test.size() - 1; ++i)
  50. {
  51. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  52. glm::simdMat4 m(Data[i]);
  53. glm::simdVec4 d(glm::detail::sse_det_ps((__m128 const * const)&m));
  54. glm::vec4 v;//(d);
  55. Test[i] = v.x;
  56. }
  57. std::clock_t TimeEnd = clock();
  58. printf("Det C: %ld\n", TimeEnd - TimeStart);
  59. return Test;
  60. }
  61. std::vector<float> test_detD(std::vector<glm::mat4> const & Data)
  62. {
  63. std::vector<float> Test(Data.size());
  64. std::clock_t TimeStart = clock();
  65. for(std::size_t i = 0; i < Test.size() - 1; ++i)
  66. {
  67. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  68. glm::simdMat4 m(Data[i]);
  69. glm::simdVec4 d(glm::detail::sse_detd_ps((__m128 const * const)&m));
  70. glm::vec4 v;//(d);
  71. Test[i] = v.x;
  72. }
  73. std::clock_t TimeEnd = clock();
  74. printf("Det D: %ld\n", TimeEnd - TimeStart);
  75. return Test;
  76. }
  77. void test_invA(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  78. {
  79. //std::vector<float> Test(Data.size());
  80. Out.resize(Data.size());
  81. std::clock_t TimeStart = clock();
  82. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  83. {
  84. Out[i] = glm::inverse(Data[i]);
  85. }
  86. std::clock_t TimeEnd = clock();
  87. printf("Inv A: %ld\n", TimeEnd - TimeStart);
  88. }
  89. void test_invC(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  90. {
  91. //std::vector<float> Test(Data.size());
  92. Out.resize(Data.size());
  93. std::clock_t TimeStart = clock();
  94. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  95. {
  96. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  97. glm::simdMat4 m(Data[i]);
  98. glm::simdMat4 o;
  99. glm::detail::sse_inverse_fast_ps((__m128 const * const)&m, (__m128 *)&o);
  100. Out[i] = *(glm::mat4*)&o;
  101. }
  102. std::clock_t TimeEnd = clock();
  103. printf("Inv C: %ld\n", TimeEnd - TimeStart);
  104. }
  105. void test_invD(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  106. {
  107. //std::vector<float> Test(Data.size());
  108. Out.resize(Data.size());
  109. std::clock_t TimeStart = clock();
  110. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  111. {
  112. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  113. glm::simdMat4 m(Data[i]);
  114. glm::simdMat4 o;
  115. glm::detail::sse_inverse_ps((__m128 const * const)&m, (__m128 *)&o);
  116. Out[i] = *(glm::mat4*)&o;
  117. }
  118. std::clock_t TimeEnd = clock();
  119. printf("Inv D: %ld\n", TimeEnd - TimeStart);
  120. }
  121. void test_mulA(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  122. {
  123. //std::vector<float> Test(Data.size());
  124. Out.resize(Data.size());
  125. std::clock_t TimeStart = clock();
  126. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  127. {
  128. Out[i] = Data[i] * Data[i];
  129. }
  130. std::clock_t TimeEnd = clock();
  131. printf("Mul A: %ld\n", TimeEnd - TimeStart);
  132. }
  133. void test_mulD(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  134. {
  135. //std::vector<float> Test(Data.size());
  136. Out.resize(Data.size());
  137. std::clock_t TimeStart = clock();
  138. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  139. {
  140. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  141. glm::simdMat4 m(Data[i]);
  142. glm::detail::sse_mul_ps((__m128 const * const)&m, (__m128 const * const)&m, (__m128*)&Out[i]);
  143. }
  144. std::clock_t TimeEnd = clock();
  145. printf("Mul D: %ld\n", TimeEnd - TimeStart);
  146. }
  147. int test_compute_glm()
  148. {
  149. return 0;
  150. }
  151. int test_compute_gtx()
  152. {
  153. std::vector<glm::vec4> Output(1000000);
  154. std::clock_t TimeStart = clock();
  155. for(std::size_t k = 0; k < Output.size(); ++k)
  156. {
  157. float i = float(k) / 1000.f;
  158. glm::vec3 A = glm::normalize(glm::vec3(i));
  159. glm::vec3 B = glm::cross(A, glm::vec3(0, 0, 1));
  160. glm::mat4 C = glm::rotate(glm::mat4(1.0f), i, B);
  161. glm::mat4 D = glm::scale(C, glm::vec3(0.8f, 1.0f, 1.2f));
  162. glm::mat4 E = glm::translate(D, glm::vec3(1.4f, 1.2f, 1.1f));
  163. glm::mat4 F = glm::perspective(i, 1.5f, 0.1f, 1000.f);
  164. glm::mat4 G = glm::inverse(F * E);
  165. glm::vec3 H = glm::unProject(glm::vec3(i), G, F, E[3]);
  166. glm::vec3 I = glm::project(H, G, F, E[3]);
  167. glm::mat4 J = glm::lookAt(glm::normalize(B), H, I);
  168. glm::mat4 K = glm::transpose(J);
  169. glm::quat L = glm::normalize(glm::quat_cast(K));
  170. glm::vec4 M = L * glm::smoothstep(K[3], J[3], glm::vec4(i));
  171. glm::mat4 N = glm::mat4(glm::normalize(M), K[3], J[3], glm::vec4(i));
  172. glm::mat4 O = N * glm::inverse(N);
  173. glm::vec4 P = O * glm::reflect(N[3], glm::vec4(A, 1.0f));
  174. glm::vec4 Q = glm::vec4(glm::dot(M, P));
  175. glm::vec4 R = glm::quat(Q.w, glm::vec3(Q)) * P;
  176. Output[k] = R;
  177. }
  178. std::clock_t TimeEnd = clock();
  179. printf("test_compute_gtx: %ld\n", TimeEnd - TimeStart);
  180. return Output.size() != 0;
  181. }
  182. int main()
  183. {
  184. int Failed = GLM_COMPILER;
  185. std::vector<glm::mat4> Data(1024 * 1024 * 8);
  186. for(std::size_t i = 0; i < Data.size(); ++i)
  187. Data[i] = glm::mat4(
  188. glm::vec4(glm::compRand4(-2.0f, 2.0f)),
  189. glm::vec4(glm::compRand4(-2.0f, 2.0f)),
  190. glm::vec4(glm::compRand4(-2.0f, 2.0f)),
  191. glm::vec4(glm::compRand4(-2.0f, 2.0f)));
  192. {
  193. std::vector<glm::mat4> TestInvA;
  194. test_invA(Data, TestInvA);
  195. }
  196. {
  197. std::vector<glm::mat4> TestInvC;
  198. test_invC(Data, TestInvC);
  199. }
  200. {
  201. std::vector<glm::mat4> TestInvD;
  202. test_invD(Data, TestInvD);
  203. }
  204. {
  205. std::vector<glm::mat4> TestA;
  206. test_mulA(Data, TestA);
  207. }
  208. {
  209. std::vector<glm::mat4> TestD;
  210. test_mulD(Data, TestD);
  211. }
  212. {
  213. std::vector<float> TestDetA = test_detA(Data);
  214. std::vector<float> TestDetB = test_detB(Data);
  215. std::vector<float> TestDetD = test_detD(Data);
  216. std::vector<float> TestDetC = test_detC(Data);
  217. for(std::size_t i = 0; i < TestDetA.size(); ++i)
  218. if(TestDetA[i] != TestDetB[i] && TestDetC[i] != TestDetB[i] && TestDetC[i] != TestDetD[i])
  219. return 1;
  220. }
  221. // shuffle test
  222. glm::simdVec4 A(1.0f, 2.0f, 3.0f, 4.0f);
  223. glm::simdVec4 B(5.0f, 6.0f, 7.0f, 8.0f);
  224. __m128 C = _mm_shuffle_ps(A.Data, B.Data, _MM_SHUFFLE(1, 0, 1, 0));
  225. Failed += test_compute_glm();
  226. Failed += test_compute_gtx();
  227. float Det = glm::determinant(glm::simdMat4(1.0));
  228. glm::simdMat4 D = glm::matrixCompMult(glm::simdMat4(1.0), glm::simdMat4(1.0));
  229. system("pause");
  230. return Failed;
  231. }