/////////////////////////////////////////////////////////////////////////////////////////////////// // OpenGL Mathematics Copyright (c) 2005 - 2010 G-Truc Creation (www.g-truc.net) /////////////////////////////////////////////////////////////////////////////////////////////////// // Created : 2010-09-16 // Updated : 2010-09-16 // Licence : This source is under MIT licence // File : test/gtx/simd-mat4.cpp /////////////////////////////////////////////////////////////////////////////////////////////////// #define GLM_INSTRUCTION_SET GLM_PLATFORM_SSE3 | GLM_PLATFORM_SSE2 #include #include #include #include #include #include #include std::vector test_detA(std::vector const & Data) { std::vector Test(Data.size()); std::clock_t TimeStart = clock(); for(std::size_t i = 0; i < Test.size() - 1; ++i) Test[i] = glm::determinant(Data[i]); std::clock_t TimeEnd = clock(); printf("Det A: %d\n", TimeEnd - TimeStart); return Test; } std::vector test_detB(std::vector const & Data) { std::vector Test(Data.size()); std::clock_t TimeStart = clock(); for(std::size_t i = 0; i < Test.size() - 1; ++i) { _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0); glm::simd_mat4 m(Data[i]); Test[i] = glm::simd_vec4(glm::detail::sse_slow_det_ps((__m128 const * const)&m)).x; } std::clock_t TimeEnd = clock(); printf("Det B: %d\n", TimeEnd - TimeStart); return Test; } std::vector test_detC(std::vector const & Data) { std::vector Test(Data.size()); std::clock_t TimeStart = clock(); for(std::size_t i = 0; i < Test.size() - 1; ++i) { _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0); glm::simd_mat4 m(Data[i]); Test[i] = glm::simd_vec4(glm::detail::sse_det_ps((__m128 const * const)&m)).x; } std::clock_t TimeEnd = clock(); printf("Det C: %d\n", TimeEnd - TimeStart); return Test; } std::vector test_detD(std::vector const & Data) { std::vector Test(Data.size()); std::clock_t TimeStart = clock(); for(std::size_t i = 0; i < Test.size() - 1; ++i) { _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0); glm::simd_mat4 m(Data[i]); Test[i] = glm::simd_vec4(glm::detail::sse_detd_ps((__m128 const * const)&m)).x; } std::clock_t TimeEnd = clock(); printf("Det D: %d\n", TimeEnd - TimeStart); return Test; } void test_invA(std::vector const & Data, std::vector & Out) { //std::vector Test(Data.size()); Out.resize(Data.size()); std::clock_t TimeStart = clock(); for(std::size_t i = 0; i < Out.size() - 1; ++i) { Out[i] = glm::inverse(Data[i]); } std::clock_t TimeEnd = clock(); printf("Inv A: %d\n", TimeEnd - TimeStart); } void test_invC(std::vector const & Data, std::vector & Out) { //std::vector Test(Data.size()); Out.resize(Data.size()); std::clock_t TimeStart = clock(); for(std::size_t i = 0; i < Out.size() - 1; ++i) { _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0); glm::simd_mat4 m(Data[i]); glm::simd_mat4 o; glm::detail::sse_inverse_fast_ps((__m128 const * const)&m, (__m128 *)&o); Out[i] = *(glm::mat4*)&o; } std::clock_t TimeEnd = clock(); printf("Inv C: %d\n", TimeEnd - TimeStart); } void test_invD(std::vector const & Data, std::vector & Out) { //std::vector Test(Data.size()); Out.resize(Data.size()); std::clock_t TimeStart = clock(); for(std::size_t i = 0; i < Out.size() - 1; ++i) { _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0); glm::simd_mat4 m(Data[i]); glm::simd_mat4 o; glm::detail::sse_inverse_ps((__m128 const * const)&m, (__m128 *)&o); Out[i] = *(glm::mat4*)&o; } std::clock_t TimeEnd = clock(); printf("Inv D: %d\n", TimeEnd - TimeStart); } void test_mulA(std::vector const & Data, std::vector & Out) { //std::vector Test(Data.size()); Out.resize(Data.size()); std::clock_t TimeStart = clock(); for(std::size_t i = 0; i < Out.size() - 1; ++i) { Out[i] = Data[i] * Data[i]; } std::clock_t TimeEnd = clock(); printf("Mul A: %d\n", TimeEnd - TimeStart); } void test_mulD(std::vector const & Data, std::vector & Out) { //std::vector Test(Data.size()); Out.resize(Data.size()); std::clock_t TimeStart = clock(); for(std::size_t i = 0; i < Out.size() - 1; ++i) { _mm_prefetch((char*)&Data[i + 1], _MM_HINT_T0); glm::simd_mat4 m(Data[i]); glm::detail::sse_mul_ps((__m128 const * const)&m, (__m128 const * const)&m, (__m128*)&Out[i]); } std::clock_t TimeEnd = clock(); printf("Mul D: %d\n", TimeEnd - TimeStart); } int main(int argc, void* argv[]) { std::vector Data(1024 * 1024 * 8); for(std::size_t i = 0; i < Data.size(); ++i) Data[i] = glm::mat4( glm::vec4(glm::compRand4(-2.0f, 2.0f)), glm::vec4(glm::compRand4(-2.0f, 2.0f)), glm::vec4(glm::compRand4(-2.0f, 2.0f)), glm::vec4(glm::compRand4(-2.0f, 2.0f))); { std::vector TestInvA; test_invA(Data, TestInvA); } { std::vector TestInvC; test_invC(Data, TestInvC); } { std::vector TestInvD; test_invD(Data, TestInvD); } { std::vector TestA; test_mulA(Data, TestA); } { std::vector TestD; test_mulD(Data, TestD); } { std::vector TestDetA = test_detA(Data); std::vector TestDetB = test_detB(Data); std::vector TestDetC = test_detC(Data); std::vector TestDetD = test_detD(Data); for(std::size_t i = 0; i < TestDetA.size(); ++i) if(TestDetA[i] != TestDetB[i] && TestDetC[i] != TestDetB[i] && TestDetC[i] != TestDetD[i]) return 1; } // shuffle test glm::simd_vec4 A(1.0f, 2.0f, 3.0f, 4.0f); glm::simd_vec4 B(5.0f, 6.0f, 7.0f, 8.0f); __m128 C = _mm_shuffle_ps(A.Data, B.Data, _MM_SHUFFLE(1, 0, 1, 0)); system("pause"); return 0; }