From e19734f6fcdf5fd9a395d6d18d9d23b0f36c37a9 Mon Sep 17 00:00:00 2001
From: Groove
Date: Sat, 18 Aug 2018 16:12:26 +0200
Subject: [PATCH] Added SIMD perf tests

---
 glm/detail/func_matrix.inl    |   3 -
 test/core/CMakeLists.txt      |   1 +
 test/core/core_setup_simd.cpp | 182 ++++++++++++++++++++++++++++++++++
 3 files changed, 183 insertions(+), 3 deletions(-)
 create mode 100644 test/core/core_setup_simd.cpp

diff --git a/glm/detail/func_matrix.inl b/glm/detail/func_matrix.inl
index e38f3ee4..d980c6d3 100644
--- a/glm/detail/func_matrix.inl
+++ b/glm/detail/func_matrix.inl
@@ -1,6 +1,3 @@
-/// @ref core
-/// @file glm/detail/func_matrix.inl
-
 #include "../geometric.hpp"
 #include <limits>
 
diff --git a/test/core/CMakeLists.txt b/test/core/CMakeLists.txt
index 2ea39ed9..366fc9d1 100644
--- a/test/core/CMakeLists.txt
+++ b/test/core/CMakeLists.txt
@@ -42,6 +42,7 @@ glmCreateTestGTC(core_setup_force_cxx98)
 glmCreateTestGTC(core_setup_force_size_t_length)
 glmCreateTestGTC(core_setup_message)
 glmCreateTestGTC(core_setup_precision)
+glmCreateTestGTC(core_setup_simd)
 
 
 
diff --git a/test/core/core_setup_simd.cpp b/test/core/core_setup_simd.cpp
new file mode 100644
index 00000000..b8f3de01
--- /dev/null
+++ b/test/core/core_setup_simd.cpp
@@ -0,0 +1,182 @@
+#define GLM_FORCE_INLINE
+// NOTE(review): the header names on the #include lines were lost when this patch
+// was extracted; the set below is reconstructed from the names this file uses.
+// Confirm it against the upstream commit.
+#include <glm/matrix.hpp>
+#include <glm/vec4.hpp>
+#include <glm/mat4x4.hpp>
+#if GLM_CONFIG_SIMD == GLM_ENABLE
+#include <glm/gtc/type_aligned.hpp>
+#include <vector>
+#include <chrono>
+#include <cstdio>
+
+// Stores M * I[i] in O[i] for every element of I; O must hold at least I.size() elements.
+template <typename matType, typename vecType>
+static void test_mat_mul_vec(matType const& M, std::vector<vecType> const& I, std::vector<vecType>& O)
+{
+	for (std::size_t i = 0, n = I.size(); i < n; ++i)
+		O[i] = M * I[i];
+}
+
+// Returns the microseconds test_mat_mul_vec takes over Samples generated vectors.
+template <typename matType, typename vecType>
+static int launch_mat_mul_vec(std::size_t Samples)
+{
+	typedef typename vecType::value_type T;
+
+	static const matType Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16);
+
+	{
+		std::vector<vecType> I(Samples);
+		std::vector<vecType> O(Samples);
+
+		// Inputs are generated before the clock starts so only the products are timed.
+		for(std::size_t i = 0; i < Samples; ++i)
+			I[i] = vecType(static_cast<T>(i)) * vecType(0.01, 0.02, 0.03, 0.05);
+
+		std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now();
+		test_mat_mul_vec<matType, vecType>(Transform, I, O);
+		std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now();
+
+		return static_cast<int>(std::chrono::duration_cast<std::chrono::microseconds>(t2 - t1).count());
+	}
+}
+
+// Stores I[i] * M in O[i] for every element of I; O must hold at least I.size() elements.
+template <typename matType, typename vecType>
+static void test_vec_mul_mat(matType const& M, std::vector<vecType> const& I, std::vector<vecType>& O)
+{
+	for (std::size_t i = 0, n = I.size(); i < n; ++i)
+		O[i] = I[i] * M;
+}
+
+// Returns the microseconds test_vec_mul_mat takes over Samples generated vectors.
+template <typename matType, typename vecType>
+static int launch_vec_mul_mat(std::size_t Samples)
+{
+	typedef typename vecType::value_type T;
+
+	static const matType Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16);
+
+	std::vector<vecType> I(Samples);
+	std::vector<vecType> O(Samples);
+
+	for(std::size_t i = 0; i < Samples; ++i)
+		I[i] = vecType(static_cast<T>(i)) * vecType(0.01, 0.02, 0.03, 0.05);
+
+	std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now();
+	// Must time vec * mat: calling test_mat_mul_vec here would repeat the mat4 * vec4 measurement.
+	test_vec_mul_mat<matType, vecType>(Transform, I, O);
+	std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now();
+
+	return static_cast<int>(std::chrono::duration_cast<std::chrono::microseconds>(t2 - t1).count());
+}
+
+// Stores M * I[i] in O[i] for every matrix of I; O must hold at least I.size() elements.
+template <typename matType>
+static void test_mat_mul_mat(matType const& M, std::vector<matType> const& I, std::vector<matType>& O)
+{
+	for (std::size_t i = 0, n = I.size(); i < n; ++i)
+		O[i] = M * I[i];
+}
+
+// Returns the microseconds test_mat_mul_mat takes over Samples generated matrices.
+template <typename matType>
+static int launch_mat_mul_mat(std::size_t Samples)
+{
+	typedef typename matType::value_type T;
+
+	static const matType Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16);
+
+	{
+		std::vector<matType> I(Samples);
+		std::vector<matType> O(Samples);
+
+		for(std::size_t i = 0; i < Samples; ++i)
+			I[i] = matType(static_cast<T>(i)) * matType(0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05);
+
+		std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now();
+		test_mat_mul_mat<matType>(Transform, I, O);
+		std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now();
+
+		return static_cast<int>(std::chrono::duration_cast<std::chrono::microseconds>(t2 - t1).count());
+	}
+}
+
+// Stores M / I[i] in O[i] for every matrix of I; O must hold at least I.size() elements.
+template <typename matType>
+static void test_mat_div_mat(matType const& M, std::vector<matType> const& I, std::vector<matType>& O)
+{
+	for (std::size_t i = 0, n = I.size(); i < n; ++i)
+		O[i] = M / I[i];
+}
+
+// Returns the microseconds test_mat_div_mat takes over Samples generated matrices.
+template <typename matType>
+static int launch_mat_div_mat(std::size_t Samples)
+{
+	typedef typename matType::value_type T;
+
+	static const matType Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16);
+
+	{
+		std::vector<matType> I(Samples);
+		std::vector<matType> O(Samples);
+
+		// NOTE(review): the scale matrix repeats one group of four values, so it has rank 1 and
+		// every divisor is singular; confirm that timing such a division is intended.
+		for(std::size_t i = 0; i < Samples; ++i)
+			I[i] = matType(static_cast<T>(i)) * matType(0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05);
+
+		std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now();
+		test_mat_div_mat<matType>(Transform, I, O);
+		std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now();
+
+		return static_cast<int>(std::chrono::duration_cast<std::chrono::microseconds>(t2 - t1).count());
+	}
+}
+
+// Prints the measured duration of each operation, once per type listed in the labels.
+int main()
+{
+	std::size_t const Samples = 50000;
+
+	// NOTE(review): the template arguments of the launch_* calls were lost in extraction; the
+	// plain and aligned GLM types below are inferred from the printed labels - confirm upstream.
+	printf("\nmat4 * vec4\n");
+	printf("- dmat4 * dvec4 duration %d us\n", launch_mat_mul_vec<glm::dmat4, glm::dvec4>(Samples));
+	printf("- dmat4 * dvec4 (SIMD) duration %d us\n", launch_mat_mul_vec<glm::aligned_dmat4, glm::aligned_dvec4>(Samples));
+	printf("- mat4 * vec4 duration %d us\n", launch_mat_mul_vec<glm::mat4, glm::vec4>(Samples));
+	printf("- mat4 * vec4 (SIMD) duration %d us\n", launch_mat_mul_vec<glm::aligned_mat4, glm::aligned_vec4>(Samples));
+
+	printf("\nvec4 * mat4\n");
+	printf("- dvec4 * dmat4 duration %d us\n", launch_vec_mul_mat<glm::dmat4, glm::dvec4>(Samples));
+	printf("- dvec4 * dmat4 (SIMD) duration %d us\n", launch_vec_mul_mat<glm::aligned_dmat4, glm::aligned_dvec4>(Samples));
+	printf("- vec4 * mat4 duration %d us\n", launch_vec_mul_mat<glm::mat4, glm::vec4>(Samples));
+	printf("- vec4 * mat4 (SIMD) duration %d us\n", launch_vec_mul_mat<glm::aligned_mat4, glm::aligned_vec4>(Samples));
+
+	printf("\nmat4 * mat4\n");
+	printf("- dmat4 * dmat4 duration %d us\n", launch_mat_mul_mat<glm::dmat4>(Samples));
+	printf("- dmat4 * dmat4 (SIMD) duration %d us\n", launch_mat_mul_mat<glm::aligned_dmat4>(Samples));
+	printf("- mat4 * mat4 duration %d us\n", launch_mat_mul_mat<glm::mat4>(Samples));
+	printf("- mat4 * mat4 (SIMD) duration %d us\n", launch_mat_mul_mat<glm::aligned_mat4>(Samples));
+
+	printf("\nmat4 / mat4\n");
+	printf("- dmat4 / dmat4 duration %d us\n", launch_mat_div_mat<glm::dmat4>(Samples));
+	printf("- dmat4 / dmat4 (SIMD) duration %d us\n", launch_mat_div_mat<glm::aligned_dmat4>(Samples));
+	printf("- mat4 / mat4 duration %d us\n", launch_mat_div_mat<glm::mat4>(Samples));
+	printf("- mat4 / mat4 (SIMD) duration %d us\n", launch_mat_div_mat<glm::aligned_mat4>(Samples));
+
+	return 0;
+}
+
+#else
+
+// GLM_CONFIG_SIMD is not enabled in this configuration, so nothing is measured.
+int main()
+{
+	return 0;
+}
+
+#endif