core_setup_simd.cpp 6.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171
  1. #define GLM_FORCE_INLINE
  2. #include <glm/ext/matrix_float4x4.hpp>
  3. #include <glm/ext/matrix_transform.hpp>
  4. #include <glm/ext/vector_float4.hpp>
  5. #if GLM_CONFIG_SIMD == GLM_ENABLE
  6. #include <glm/gtc/type_aligned.hpp>
  7. #include <vector>
  8. #include <chrono>
  9. #include <cstdio>
  10. template <typename matType, typename vecType>
  11. static void test_mat_mul_vec(matType const& M, std::vector<vecType> const& I, std::vector<vecType>& O)
  12. {
  13. typedef typename vecType::value_type T;
  14. for (std::size_t i = 0, n = I.size(); i < n; ++i)
  15. O[i] = M * I[i];
  16. }
  17. template <typename matType, typename vecType>
  18. static int launch_mat_mul_vec(std::size_t Samples)
  19. {
  20. typedef typename vecType::value_type T;
  21. static const matType Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16);
  22. {
  23. std::vector<vecType> I(Samples);
  24. std::vector<vecType> O(Samples);
  25. for(std::size_t i = 0; i < Samples; ++i)
  26. I[i] = vecType(static_cast<T>(i)) * vecType(0.01, 0.02, 0.03, 0.05);
  27. std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now();
  28. test_mat_mul_vec<matType, vecType>(Transform, I, O);
  29. std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now();
  30. return static_cast<int>(std::chrono::duration_cast<std::chrono::microseconds>(t2 - t1).count());
  31. }
  32. }
  33. template <typename matType, typename vecType>
  34. static void test_vec_mul_mat(matType const& M, std::vector<vecType> const& I, std::vector<vecType>& O)
  35. {
  36. typedef typename vecType::value_type T;
  37. for (std::size_t i = 0, n = I.size(); i < n; ++i)
  38. O[i] = I[i] * M;
  39. }
  40. template <typename matType, typename vecType>
  41. static int launch_vec_mul_mat(std::size_t Samples)
  42. {
  43. typedef typename vecType::value_type T;
  44. static const matType Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16);
  45. std::vector<vecType> I(Samples);
  46. std::vector<vecType> O(Samples);
  47. for(std::size_t i = 0; i < Samples; ++i)
  48. I[i] = vecType(static_cast<T>(i)) * vecType(0.01, 0.02, 0.03, 0.05);
  49. std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now();
  50. test_mat_mul_vec<matType, vecType>(Transform, I, O);
  51. std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now();
  52. return static_cast<int>(std::chrono::duration_cast<std::chrono::microseconds>(t2 - t1).count());
  53. }
  54. template <typename matType>
  55. static void test_mat_mul_mat(matType const& M, std::vector<matType> const& I, std::vector<matType>& O)
  56. {
  57. typedef typename matType::value_type T;
  58. for (std::size_t i = 0, n = I.size(); i < n; ++i)
  59. O[i] = M * I[i];
  60. }
  61. template <typename matType>
  62. static int launch_mat_mul_mat(std::size_t Samples)
  63. {
  64. typedef typename matType::value_type T;
  65. static const matType Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16);
  66. {
  67. std::vector<matType> I(Samples);
  68. std::vector<matType> O(Samples);
  69. for(std::size_t i = 0; i < Samples; ++i)
  70. I[i] = matType(static_cast<T>(i)) * matType(0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05);
  71. std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now();
  72. test_mat_mul_mat<matType>(Transform, I, O);
  73. std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now();
  74. return static_cast<int>(std::chrono::duration_cast<std::chrono::microseconds>(t2 - t1).count());
  75. }
  76. }
  77. template <typename matType>
  78. static void test_mat_div_mat(matType const& M, std::vector<matType> const& I, std::vector<matType>& O)
  79. {
  80. typedef typename matType::value_type T;
  81. for (std::size_t i = 0, n = I.size(); i < n; ++i)
  82. O[i] = M / I[i];
  83. }
  84. template <typename matType>
  85. static int launch_mat_div_mat(std::size_t Samples)
  86. {
  87. typedef typename matType::value_type T;
  88. static const matType Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16);
  89. {
  90. std::vector<matType> I(Samples);
  91. std::vector<matType> O(Samples);
  92. for(std::size_t i = 0; i < Samples; ++i)
  93. I[i] = matType(static_cast<T>(i)) * matType(0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05);
  94. std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now();
  95. test_mat_div_mat<matType>(Transform, I, O);
  96. std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now();
  97. return static_cast<int>(std::chrono::duration_cast<std::chrono::microseconds>(t2 - t1).count());
  98. }
  99. }
  100. int main()
  101. {
  102. std::size_t const Samples = 50000;
  103. printf("\nmat4 * vec4\n");
  104. printf("- dmat4 * dvec4 duration %d us\n", launch_mat_mul_vec<glm::dmat4, glm::dvec4>(Samples));
  105. printf("- dmat4 * dvec4 (SIMD) duration %d us\n", launch_mat_mul_vec<glm::aligned_dmat4, glm::aligned_dvec4>(Samples));
  106. printf("- mat4 * vec4 duration %d us\n", launch_mat_mul_vec<glm::mat4, glm::vec4>(Samples));
  107. printf("- mat4 * vec4 (SIMD) duration %d us\n", launch_mat_mul_vec<glm::aligned_mat4, glm::aligned_vec4>(Samples));
  108. printf("\nvec4 * mat4\n");
  109. printf("- dvec4 * dmat4 duration %d us\n", launch_vec_mul_mat<glm::dmat4, glm::dvec4>(Samples));
  110. printf("- dvec4 * dmat4 (SIMD) duration %d us\n", launch_vec_mul_mat<glm::aligned_dmat4, glm::aligned_dvec4>(Samples));
  111. printf("- vec4 * mat4 duration %d us\n", launch_vec_mul_mat<glm::mat4, glm::vec4>(Samples));
  112. printf("- vec4 * mat4 (SIMD) duration %d us\n", launch_vec_mul_mat<glm::aligned_mat4, glm::aligned_vec4>(Samples));
  113. printf("\nmat4 * mat4\n");
  114. printf("- dmat4 * dmat4 duration %d us\n", launch_mat_mul_mat<glm::dmat4>(Samples));
  115. printf("- dmat4 * dmat4 (SIMD) duration %d us\n", launch_mat_mul_mat<glm::aligned_dmat4>(Samples));
  116. printf("- mat4 * mat4 duration %d us\n", launch_mat_mul_mat<glm::mat4>(Samples));
  117. printf("- mat4 * mat4 (SIMD) duration %d us\n", launch_mat_mul_mat<glm::aligned_mat4>(Samples));
  118. printf("\nmat4 / mat4\n");
  119. printf("- dmat4 / dmat4 duration %d us\n", launch_mat_div_mat<glm::dmat4>(Samples));
  120. printf("- dmat4 / dmat4 (SIMD) duration %d us\n", launch_mat_div_mat<glm::aligned_dmat4>(Samples));
  121. printf("- mat4 / mat4 duration %d us\n", launch_mat_div_mat<glm::mat4>(Samples));
  122. printf("- mat4 / mat4 (SIMD) duration %d us\n", launch_mat_div_mat<glm::aligned_mat4>(Samples));
  123. return 0;
  124. }
  125. #else
  126. int main()
  127. {
  128. return 0;
  129. }
  130. #endif