gtx_simd_mat4.cpp 7.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302
  1. ///////////////////////////////////////////////////////////////////////////////////////////////////
  2. // OpenGL Mathematics Copyright (c) 2005 - 2011 G-Truc Creation (www.g-truc.net)
  3. ///////////////////////////////////////////////////////////////////////////////////////////////////
  4. // Created : 2010-09-16
  5. // Updated : 2010-09-16
  6. // Licence : This source is under MIT licence
  7. // File : test/gtx/simd-mat4.cpp
  8. ///////////////////////////////////////////////////////////////////////////////////////////////////
  9. #include <glm/glm.hpp>
  10. #include <glm/gtc/matrix_transform.hpp>
  11. #include <glm/gtc/quaternion.hpp>
  12. #include <glm/gtx/random.hpp>
  13. #include <glm/gtx/simd_vec4.hpp>
  14. #include <glm/gtx/simd_mat4.hpp>
  15. #include <iostream>
  16. #include <cstdio>
  17. #include <ctime>
  18. #include <vector>
  19. #if(GLM_ARCH != GLM_ARCH_PURE)
  20. std::vector<float> test_detA(std::vector<glm::mat4> const & Data)
  21. {
  22. std::vector<float> Test(Data.size());
  23. std::clock_t TimeStart = clock();
  24. for(std::size_t i = 0; i < Test.size() - 1; ++i)
  25. Test[i] = glm::determinant(Data[i]);
  26. std::clock_t TimeEnd = clock();
  27. printf("Det A: %ld\n", TimeEnd - TimeStart);
  28. return Test;
  29. }
  30. std::vector<float> test_detB(std::vector<glm::mat4> const & Data)
  31. {
  32. std::vector<float> Test(Data.size());
  33. std::clock_t TimeStart = clock();
  34. for(std::size_t i = 0; i < Test.size() - 1; ++i)
  35. {
  36. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  37. glm::simdMat4 m(Data[i]);
  38. glm::simdVec4 d(glm::detail::sse_slow_det_ps((__m128 const * const)&m));
  39. glm::vec4 v;//(d);
  40. Test[i] = v.x;
  41. }
  42. std::clock_t TimeEnd = clock();
  43. printf("Det B: %ld\n", TimeEnd - TimeStart);
  44. return Test;
  45. }
  46. std::vector<float> test_detC(std::vector<glm::mat4> const & Data)
  47. {
  48. std::vector<float> Test(Data.size());
  49. std::clock_t TimeStart = clock();
  50. for(std::size_t i = 0; i < Test.size() - 1; ++i)
  51. {
  52. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  53. glm::simdMat4 m(Data[i]);
  54. glm::simdVec4 d(glm::detail::sse_det_ps((__m128 const * const)&m));
  55. glm::vec4 v;//(d);
  56. Test[i] = v.x;
  57. }
  58. std::clock_t TimeEnd = clock();
  59. printf("Det C: %ld\n", TimeEnd - TimeStart);
  60. return Test;
  61. }
  62. std::vector<float> test_detD(std::vector<glm::mat4> const & Data)
  63. {
  64. std::vector<float> Test(Data.size());
  65. std::clock_t TimeStart = clock();
  66. for(std::size_t i = 0; i < Test.size() - 1; ++i)
  67. {
  68. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  69. glm::simdMat4 m(Data[i]);
  70. glm::simdVec4 d(glm::detail::sse_detd_ps((__m128 const * const)&m));
  71. glm::vec4 v;//(d);
  72. Test[i] = v.x;
  73. }
  74. std::clock_t TimeEnd = clock();
  75. printf("Det D: %ld\n", TimeEnd - TimeStart);
  76. return Test;
  77. }
  78. void test_invA(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  79. {
  80. //std::vector<float> Test(Data.size());
  81. Out.resize(Data.size());
  82. std::clock_t TimeStart = clock();
  83. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  84. {
  85. Out[i] = glm::inverse(Data[i]);
  86. }
  87. std::clock_t TimeEnd = clock();
  88. printf("Inv A: %ld\n", TimeEnd - TimeStart);
  89. }
  90. void test_invC(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  91. {
  92. //std::vector<float> Test(Data.size());
  93. Out.resize(Data.size());
  94. std::clock_t TimeStart = clock();
  95. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  96. {
  97. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  98. glm::simdMat4 m(Data[i]);
  99. glm::simdMat4 o;
  100. glm::detail::sse_inverse_fast_ps((__m128 const * const)&m, (__m128 *)&o);
  101. Out[i] = *(glm::mat4*)&o;
  102. }
  103. std::clock_t TimeEnd = clock();
  104. printf("Inv C: %ld\n", TimeEnd - TimeStart);
  105. }
  106. void test_invD(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  107. {
  108. //std::vector<float> Test(Data.size());
  109. Out.resize(Data.size());
  110. std::clock_t TimeStart = clock();
  111. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  112. {
  113. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  114. glm::simdMat4 m(Data[i]);
  115. glm::simdMat4 o;
  116. glm::detail::sse_inverse_ps((__m128 const * const)&m, (__m128 *)&o);
  117. Out[i] = *(glm::mat4*)&o;
  118. }
  119. std::clock_t TimeEnd = clock();
  120. printf("Inv D: %ld\n", TimeEnd - TimeStart);
  121. }
  122. void test_mulA(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  123. {
  124. //std::vector<float> Test(Data.size());
  125. Out.resize(Data.size());
  126. std::clock_t TimeStart = clock();
  127. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  128. {
  129. Out[i] = Data[i] * Data[i];
  130. }
  131. std::clock_t TimeEnd = clock();
  132. printf("Mul A: %ld\n", TimeEnd - TimeStart);
  133. }
  134. void test_mulD(std::vector<glm::mat4> const & Data, std::vector<glm::mat4> & Out)
  135. {
  136. //std::vector<float> Test(Data.size());
  137. Out.resize(Data.size());
  138. std::clock_t TimeStart = clock();
  139. for(std::size_t i = 0; i < Out.size() - 1; ++i)
  140. {
  141. _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0);
  142. glm::simdMat4 m(Data[i]);
  143. glm::detail::sse_mul_ps((__m128 const * const)&m, (__m128 const * const)&m, (__m128*)&Out[i]);
  144. }
  145. std::clock_t TimeEnd = clock();
  146. printf("Mul D: %ld\n", TimeEnd - TimeStart);
  147. }
  148. int test_compute_glm()
  149. {
  150. return 0;
  151. }
  152. int test_compute_gtx()
  153. {
  154. std::vector<glm::vec4> Output(1000000);
  155. std::clock_t TimeStart = clock();
  156. for(std::size_t k = 0; k < Output.size(); ++k)
  157. {
  158. float i = float(k) / 1000.f;
  159. glm::vec3 A = glm::normalize(glm::vec3(i));
  160. glm::vec3 B = glm::cross(A, glm::vec3(0, 0, 1));
  161. glm::mat4 C = glm::rotate(glm::mat4(1.0f), i, B);
  162. glm::mat4 D = glm::scale(C, glm::vec3(0.8f, 1.0f, 1.2f));
  163. glm::mat4 E = glm::translate(D, glm::vec3(1.4f, 1.2f, 1.1f));
  164. glm::mat4 F = glm::perspective(i, 1.5f, 0.1f, 1000.f);
  165. glm::mat4 G = glm::inverse(F * E);
  166. glm::vec3 H = glm::unProject(glm::vec3(i), G, F, E[3]);
  167. glm::vec3 I = glm::project(H, G, F, E[3]);
  168. glm::mat4 J = glm::lookAt(glm::normalize(B), H, I);
  169. glm::mat4 K = glm::transpose(J);
  170. glm::quat L = glm::normalize(glm::quat_cast(K));
  171. glm::vec4 M = L * glm::smoothstep(K[3], J[3], glm::vec4(i));
  172. glm::mat4 N = glm::mat4(glm::normalize(M), K[3], J[3], glm::vec4(i));
  173. glm::mat4 O = N * glm::inverse(N);
  174. glm::vec4 P = O * glm::reflect(N[3], glm::vec4(A, 1.0f));
  175. glm::vec4 Q = glm::vec4(glm::dot(M, P));
  176. glm::vec4 R = glm::quat(Q.w, glm::vec3(Q)) * P;
  177. Output[k] = R;
  178. }
  179. std::clock_t TimeEnd = clock();
  180. printf("test_compute_gtx: %ld\n", TimeEnd - TimeStart);
  181. return 0;
  182. }
  183. int main()
  184. {
  185. int Error = 0;
  186. std::vector<glm::mat4> Data(64 * 64 * 1);
  187. for(std::size_t i = 0; i < Data.size(); ++i)
  188. Data[i] = glm::mat4(
  189. glm::vec4(glm::compRand4(-2.0f, 2.0f)),
  190. glm::vec4(glm::compRand4(-2.0f, 2.0f)),
  191. glm::vec4(glm::compRand4(-2.0f, 2.0f)),
  192. glm::vec4(glm::compRand4(-2.0f, 2.0f)));
  193. {
  194. std::vector<glm::mat4> TestInvA;
  195. test_invA(Data, TestInvA);
  196. }
  197. {
  198. std::vector<glm::mat4> TestInvC;
  199. test_invC(Data, TestInvC);
  200. }
  201. {
  202. std::vector<glm::mat4> TestInvD;
  203. test_invD(Data, TestInvD);
  204. }
  205. {
  206. std::vector<glm::mat4> TestA;
  207. test_mulA(Data, TestA);
  208. }
  209. {
  210. std::vector<glm::mat4> TestD;
  211. test_mulD(Data, TestD);
  212. }
  213. {
  214. std::vector<float> TestDetA = test_detA(Data);
  215. std::vector<float> TestDetB = test_detB(Data);
  216. std::vector<float> TestDetD = test_detD(Data);
  217. std::vector<float> TestDetC = test_detC(Data);
  218. for(std::size_t i = 0; i < TestDetA.size(); ++i)
  219. if(TestDetA[i] != TestDetB[i] && TestDetC[i] != TestDetB[i] && TestDetC[i] != TestDetD[i])
  220. return 1;
  221. }
  222. // shuffle test
  223. glm::simdVec4 A(1.0f, 2.0f, 3.0f, 4.0f);
  224. glm::simdVec4 B(5.0f, 6.0f, 7.0f, 8.0f);
  225. //__m128 C = _mm_shuffle_ps(A.Data, B.Data, _MM_SHUFFLE(1, 0, 1, 0));
  226. Error += test_compute_glm();
  227. Error += test_compute_gtx();
  228. float Det = glm::determinant(glm::simdMat4(1.0));
  229. Error += Det == 1.0f ? 0 : 1;
  230. glm::simdMat4 D = glm::matrixCompMult(glm::simdMat4(1.0), glm::simdMat4(1.0));
  231. return Error;
  232. }
  233. #else
  234. int main()
  235. {
  236. int Error = 0;
  237. return Error;
  238. }
  239. #endif//(GLM_ARCH != GLM_ARCH_PURE)