Fixed bad matrix-vector performance in CUDA (#257, #258)

This commit is contained in:
Christophe Riccio 2014-10-29 00:42:59 +01:00
parent bf9e4458b6
commit e8923c9bca
2 changed files with 2 additions and 2 deletions

View File

@@ -735,7 +735,7 @@
# define GLM_ALIGNED_STRUCT(x) __declspec(align(x)) struct # define GLM_ALIGNED_STRUCT(x) __declspec(align(x)) struct
# define GLM_RESTRICT # define GLM_RESTRICT
# define GLM_RESTRICT_VAR __restrict # define GLM_RESTRICT_VAR __restrict
#elif GLM_COMPILER & (GLM_COMPILER_GCC | GLM_COMPILER_CLANG) #elif GLM_COMPILER & (GLM_COMPILER_GCC | GLM_COMPILER_CLANG | GLM_COMPILER_CUDA)
# define GLM_DEPRECATED __attribute__((__deprecated__)) # define GLM_DEPRECATED __attribute__((__deprecated__))
# define GLM_ALIGN(x) __attribute__((aligned(x))) # define GLM_ALIGN(x) __attribute__((aligned(x)))
# define GLM_ALIGNED_STRUCT(x) struct __attribute__((aligned(x))) # define GLM_ALIGNED_STRUCT(x) struct __attribute__((aligned(x)))

View File

@@ -67,7 +67,7 @@ namespace detail
}//namespace detail }//namespace detail
template <typename T, precision P = defaultp> template <typename T, precision P = defaultp>
struct tvec4 GLM_ALIGNED_STRUCT(16) tvec4
{ {
////////////////////////////////////// //////////////////////////////////////
// Implementation detail // Implementation detail