perf_vector_mul_matrix.cpp 6.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192
  1. #define GLM_FORCE_INLINE
  2. #include <glm/ext/matrix_float2x2.hpp>
  3. #include <glm/ext/matrix_double2x2.hpp>
  4. #include <glm/ext/matrix_float3x3.hpp>
  5. #include <glm/ext/matrix_double3x3.hpp>
  6. #include <glm/ext/matrix_float4x4.hpp>
  7. #include <glm/ext/matrix_double4x4.hpp>
  8. #include <glm/ext/matrix_transform.hpp>
  9. #include <glm/ext/matrix_relational.hpp>
  10. #include <glm/ext/vector_float4.hpp>
  11. #if GLM_CONFIG_SIMD == GLM_ENABLE
  12. #include <glm/gtc/type_aligned.hpp>
  13. #include <vector>
  14. #include <chrono>
  15. #include <cstdio>
  16. template <typename matType, typename vecType, bool reverseOp>
  17. struct test_vec_mul_mat {};
  18. template <typename matType, typename vecType>
  19. struct test_vec_mul_mat< matType, vecType, false>
  20. {
  21. void operator()(matType const& M, std::vector<vecType> const& I, std::vector<vecType>& O)
  22. {
  23. for (std::size_t i = 0, n = I.size(); i < n; ++i)
  24. O[i] = I[i] * M;
  25. }
  26. };
  27. template <typename matType, typename vecType>
  28. struct test_vec_mul_mat< matType, vecType, true>
  29. {
  30. void operator()(matType const& M, std::vector<vecType> const& I, std::vector<vecType>& O)
  31. {
  32. for (std::size_t i = 0, n = I.size(); i < n; ++i)
  33. O[i] = M * I[i];
  34. }
  35. };
  36. template <typename matType, typename vecType, bool reverseOp>
  37. static int launch_vec_mul_mat(std::vector<vecType>& O, matType const& Transform, vecType const& Scale, std::size_t Samples)
  38. {
  39. typedef typename matType::value_type T;
  40. std::vector<vecType> I(Samples);
  41. O.resize(Samples);
  42. memset(I.data(), 0, I.size() * sizeof(vecType));
  43. for(std::size_t i = 0; i < Samples; ++i)
  44. I[i] = Scale * static_cast<T>(i);
  45. std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now();
  46. test_vec_mul_mat<matType, vecType, reverseOp> fct;
  47. fct(Transform, I, O);
  48. std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now();
  49. return static_cast<int>(std::chrono::duration_cast<std::chrono::microseconds>(t2 - t1).count());
  50. }
  51. template <typename packedMatType, typename packedVecType, typename alignedMatType, typename alignedVecType, bool reverseOp>
  52. static int comp_vec2_mul_mat2(std::size_t Samples)
  53. {
  54. typedef typename packedMatType::value_type T;
  55. int Error = 0;
  56. packedMatType const Transform(1, 2, 3, 4);
  57. packedVecType const Scale(0.01, 0.02);
  58. std::vector<packedVecType> SISD;
  59. std::printf("- SISD: %d us\n", launch_vec_mul_mat<packedMatType, packedVecType, reverseOp>(SISD, Transform, Scale, Samples));
  60. std::vector<alignedVecType> SIMD;
  61. std::printf("- SIMD: %d us\n", launch_vec_mul_mat<alignedMatType, alignedVecType, reverseOp>(SIMD, Transform, Scale, Samples));
  62. for(std::size_t i = 0; i < Samples; ++i)
  63. {
  64. packedVecType const A = SISD[i];
  65. packedVecType const B = packedVecType(SIMD[i]);
  66. Error += glm::all(glm::equal(A, B, static_cast<T>(0.001))) ? 0 : 1;
  67. }
  68. return Error;
  69. }
  70. template <typename packedMatType, typename packedVecType, typename alignedMatType, typename alignedVecType, bool reverseOp>
  71. static int comp_vec3_mul_mat3(std::size_t Samples)
  72. {
  73. typedef typename packedMatType::value_type T;
  74. int Error = 0;
  75. packedMatType const Transform(1, 2, 3, 4, 5, 6, 7, 8, 9);
  76. packedVecType const Scale(0.01, 0.02, 0.05);
  77. std::vector<packedVecType> SISD;
  78. std::printf("- SISD: %d us\n", launch_vec_mul_mat<packedMatType, packedVecType, reverseOp>(SISD, Transform, Scale, Samples));
  79. std::vector<alignedVecType> SIMD;
  80. std::printf("- SIMD: %d us\n", launch_vec_mul_mat<alignedMatType, alignedVecType, reverseOp>(SIMD, Transform, Scale, Samples));
  81. for(std::size_t i = 0; i < Samples; ++i)
  82. {
  83. packedVecType const A = SISD[i];
  84. packedVecType const B = SIMD[i];
  85. Error += glm::all(glm::equal(A, B, static_cast<T>(0.001))) ? 0 : 1;
  86. }
  87. return Error;
  88. }
  89. template <typename packedMatType, typename packedVecType, typename alignedMatType, typename alignedVecType, bool reverseOp>
  90. static int comp_vec4_mul_mat4(std::size_t Samples)
  91. {
  92. typedef typename packedMatType::value_type T;
  93. int Error = 0;
  94. packedMatType const Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16);
  95. packedVecType const Scale(0.01, 0.02, 0.03, 0.05);
  96. std::vector<packedVecType> SISD;
  97. std::printf("- SISD: %d us\n", launch_vec_mul_mat<packedMatType, packedVecType, reverseOp>(SISD, Transform, Scale, Samples));
  98. std::vector<alignedVecType> SIMD;
  99. std::printf("- SIMD: %d us\n", launch_vec_mul_mat<alignedMatType, alignedVecType, reverseOp>(SIMD, Transform, Scale, Samples));
  100. for(std::size_t i = 0; i < Samples; ++i)
  101. {
  102. packedVecType const A = SISD[i];
  103. packedVecType const B = SIMD[i];
  104. Error += glm::all(glm::equal(A, B, static_cast<T>(0.001))) ? 0 : 1;
  105. }
  106. return Error;
  107. }
  108. int main()
  109. {
  110. std::size_t const Samples = 1000;
  111. int Error = 0;
  112. std::printf("vec2 * mat2:\n");
  113. Error += comp_vec2_mul_mat2<glm::mat2, glm::vec2, glm::aligned_mat2, glm::aligned_vec2, false>(Samples);
  114. std::printf("dvec2 * dmat2:\n");
  115. Error += comp_vec2_mul_mat2<glm::dmat2, glm::dvec2,glm::aligned_dmat2, glm::aligned_dvec2, false>(Samples);
  116. std::printf("vec3 * mat3:\n");
  117. Error += comp_vec3_mul_mat3<glm::mat3, glm::vec3, glm::aligned_mat3, glm::aligned_vec3, false>(Samples);
  118. std::printf("dvec3 * dmat3:\n");
  119. Error += comp_vec3_mul_mat3<glm::dmat3, glm::dvec3, glm::aligned_dmat3, glm::aligned_dvec3, false>(Samples);
  120. std::printf("vec4 * mat4:\n");
  121. Error += comp_vec4_mul_mat4<glm::mat4, glm::vec4, glm::aligned_mat4, glm::aligned_vec4, false>(Samples);
  122. std::printf("dvec4 * dmat4:\n");
  123. Error += comp_vec4_mul_mat4<glm::dmat4, glm::dvec4, glm::aligned_dmat4, glm::aligned_dvec4, false>(Samples);
  124. std::printf("mat2 * vec2:\n");
  125. Error += comp_vec2_mul_mat2<glm::mat2, glm::vec2, glm::aligned_mat2, glm::aligned_vec2, true>(Samples);
  126. std::printf("dmat2 * dvec2 :\n");
  127. Error += comp_vec2_mul_mat2<glm::dmat2, glm::dvec2, glm::aligned_dmat2, glm::aligned_dvec2, true>(Samples);
  128. std::printf("mat3 * vec3:\n");
  129. Error += comp_vec3_mul_mat3<glm::mat3, glm::vec3, glm::aligned_mat3, glm::aligned_vec3, true>(Samples);
  130. std::printf("dmat3 * dvec3 :\n");
  131. Error += comp_vec3_mul_mat3<glm::dmat3, glm::dvec3, glm::aligned_dmat3, glm::aligned_dvec3, true>(Samples);
  132. std::printf("mat4 * vec4 :\n");
  133. Error += comp_vec4_mul_mat4<glm::mat4, glm::vec4, glm::aligned_mat4, glm::aligned_vec4, true>(Samples);
  134. std::printf("dmat4 * dvec4 :\n");
  135. Error += comp_vec4_mul_mat4<glm::dmat4, glm::dvec4, glm::aligned_dmat4, glm::aligned_dvec4, true>(Samples);
  136. return Error;
  137. }
  138. #else
  139. int main()
  140. {
  141. return 0;
  142. }
  143. #endif