diff --git a/test/CMakeLists.txt b/test/CMakeLists.txt
index e83261f6..988d9d9e 100644
--- a/test/CMakeLists.txt
+++ b/test/CMakeLists.txt
@@ -13,6 +13,7 @@ if(GLM_TEST_ENABLE)
 	add_subdirectory(ext)
 	add_subdirectory(gtc)
 	add_subdirectory(gtx)
+	add_subdirectory(perf)
 endif()
 
 
diff --git a/test/core/CMakeLists.txt b/test/core/CMakeLists.txt
index 366fc9d1..0af7fe29 100644
--- a/test/core/CMakeLists.txt
+++ b/test/core/CMakeLists.txt
@@ -42,7 +42,3 @@ glmCreateTestGTC(core_setup_force_cxx98)
 glmCreateTestGTC(core_setup_force_size_t_length)
 glmCreateTestGTC(core_setup_message)
 glmCreateTestGTC(core_setup_precision)
-glmCreateTestGTC(core_setup_simd)
-
-
-
diff --git a/test/perf/CMakeLists.txt b/test/perf/CMakeLists.txt
new file mode 100644
index 00000000..3c12ef5e
--- /dev/null
+++ b/test/perf/CMakeLists.txt
@@ -0,0 +1,2 @@
+glmCreateTestGTC(perf_matrix_mul)
+glmCreateTestGTC(perf_matrix_div)
diff --git a/test/core/core_setup_simd.cpp b/test/perf/perf_matrix_div.cpp
similarity index 100%
rename from test/core/core_setup_simd.cpp
rename to test/perf/perf_matrix_div.cpp
diff --git a/test/perf/perf_matrix_mul.cpp b/test/perf/perf_matrix_mul.cpp
new file mode 100644
index 00000000..7c57b7ec
--- /dev/null
+++ b/test/perf/perf_matrix_mul.cpp
@@ -0,0 +1,92 @@
+#define GLM_FORCE_INLINE
+// NOTE(review): the header names were lost when this patch was flattened;
+// the lists below are inferred from the symbols used -- confirm before applying.
+#include <glm/matrix.hpp>
+#include <glm/ext/matrix_transform.hpp>
+#include <glm/ext/matrix_relational.hpp>
+#include <glm/ext/vector_float4.hpp>
+#if GLM_CONFIG_SIMD == GLM_ENABLE
+#include <glm/gtc/type_aligned.hpp>
+#include <vector>
+#include <chrono>
+#include <cstdio>
+
+// Stores M * I[i] into O[i] for every element of I.
+// O must already hold at least I.size() elements; it is not resized here.
+template <typename matType>
+static void test_mat_mul_mat(matType const& M, std::vector<matType> const& I, std::vector<matType>& O)
+{
+	for (std::size_t i = 0, n = I.size(); i < n; ++i)
+		O[i] = M * I[i];
+}
+
+// Builds Samples inputs as Scale * i, multiplies each by Transform into O,
+// and returns the duration of the multiplication loop in microseconds.
+// Input generation and the resize of O happen outside the timed region.
+template <typename matType>
+static int launch_mat_mul_mat(std::vector<matType>& O, matType const& Transform, matType const& Scale, std::size_t Samples)
+{
+	typedef typename matType::value_type T;
+
+	std::vector<matType> I(Samples);
+	O.resize(Samples);
+
+	for(std::size_t i = 0; i < Samples; ++i)
+		I[i] = Scale * static_cast<T>(i);
+
+	std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now();
+	test_mat_mul_mat<matType>(Transform, I, O);
+	std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now();
+
+	return static_cast<int>(std::chrono::duration_cast<std::chrono::microseconds>(t2 - t1).count());
+}
+
+// Times the multiplication for both matrix types, prints the two durations,
+// and returns the number of samples whose results differ beyond the epsilon.
+static int comp_mat_mul_mat(std::size_t Samples)
+{
+	int Error = 0;
+
+	glm::mat4 const Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16);
+	glm::mat4 const Scale(0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05);
+
+	std::vector<glm::mat4> Mat4SISD;
+	printf("mat4 * mat4 (SISD) duration %d us\n", launch_mat_mul_mat<glm::mat4>(Mat4SISD, Transform, Scale, Samples));
+
+	// NOTE(review): the element type was lost in extraction; glm::aligned_mat4
+	// is presumed from the "SIMD" label and the SIMD-only guard -- confirm.
+	std::vector<glm::aligned_mat4> Mat4SIMD;
+	printf("mat4 * mat4 (SIMD) duration %d us\n", launch_mat_mul_mat<glm::aligned_mat4>(Mat4SIMD, Transform, Scale, Samples));
+
+	for(std::size_t i = 0; i < Samples; ++i)
+	{
+		// Compare through one matrix type with a float epsilon so that
+		// glm::equal selects its (mat, mat, T epsilon) overload with T = float.
+		glm::mat4 const A = Mat4SISD[i];
+		glm::mat4 const B = Mat4SIMD[i];
+		Error += glm::all(glm::equal(A, B, 0.001f)) ? 0 : 1;
+	}
+
+	return Error;
+}
+
+// Returns the number of mismatching samples, so 0 means every sample matched.
+int main()
+{
+	std::size_t const Samples = 100000;
+
+	int Error = 0;
+	Error += comp_mat_mul_mat(Samples);
+
+	return Error;
+}
+
+#else
+
+// GLM_CONFIG_SIMD is not GLM_ENABLE: nothing is measured.
+int main()
+{
+	return 0;
+}
+
+#endif