Spaces:
Running
on
Zero
Running
on
Zero
template <typename matType> | |
static void test_mat_transpose(std::vector<matType> const& I, std::vector<matType>& O) | |
{ | |
for (std::size_t i = 0, n = I.size(); i < n; ++i) | |
O[i] = glm::transpose(I[i]); | |
} | |
template <typename matType> | |
static int launch_mat_transpose(std::vector<matType>& O, matType const& Scale, std::size_t Samples) | |
{ | |
typedef typename matType::value_type T; | |
std::vector<matType> I(Samples); | |
O.resize(Samples); | |
for(std::size_t i = 0; i < Samples; ++i) | |
I[i] = Scale * static_cast<T>(i) + Scale; | |
std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now(); | |
test_mat_transpose<matType>(I, O); | |
std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now(); | |
return static_cast<int>(std::chrono::duration_cast<std::chrono::microseconds>(t2 - t1).count()); | |
} | |
template <typename packedMatType, typename alignedMatType> | |
static int comp_mat2_transpose(std::size_t Samples) | |
{ | |
typedef typename packedMatType::value_type T; | |
int Error = 0; | |
packedMatType const Scale(0.01, 0.02, 0.03, 0.05); | |
std::vector<packedMatType> SISD; | |
std::printf("- SISD: %d us\n", launch_mat_transpose<packedMatType>(SISD, Scale, Samples)); | |
std::vector<alignedMatType> SIMD; | |
std::printf("- SIMD: %d us\n", launch_mat_transpose<alignedMatType>(SIMD, Scale, Samples)); | |
for(std::size_t i = 0; i < Samples; ++i) | |
{ | |
packedMatType const A = SISD[i]; | |
packedMatType const B = SIMD[i]; | |
Error += glm::all(glm::equal(A, B, static_cast<T>(0.001))) ? 0 : 1; | |
assert(!Error); | |
} | |
return Error; | |
} | |
template <typename packedMatType, typename alignedMatType> | |
static int comp_mat3_transpose(std::size_t Samples) | |
{ | |
typedef typename packedMatType::value_type T; | |
int Error = 0; | |
packedMatType const Scale(0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01); | |
std::vector<packedMatType> SISD; | |
std::printf("- SISD: %d us\n", launch_mat_transpose<packedMatType>(SISD, Scale, Samples)); | |
std::vector<alignedMatType> SIMD; | |
std::printf("- SIMD: %d us\n", launch_mat_transpose<alignedMatType>(SIMD, Scale, Samples)); | |
for(std::size_t i = 0; i < Samples; ++i) | |
{ | |
packedMatType const A = SISD[i]; | |
packedMatType const B = SIMD[i]; | |
Error += glm::all(glm::equal(A, B, static_cast<T>(0.001))) ? 0 : 1; | |
assert(!Error); | |
} | |
return Error; | |
} | |
template <typename packedMatType, typename alignedMatType> | |
static int comp_mat4_transpose(std::size_t Samples) | |
{ | |
typedef typename packedMatType::value_type T; | |
int Error = 0; | |
packedMatType const Scale(0.01, 0.02, 0.05, 0.04, 0.02, 0.08, 0.05, 0.01, 0.08, 0.03, 0.05, 0.06, 0.02, 0.03, 0.07, 0.05); | |
std::vector<packedMatType> SISD; | |
std::printf("- SISD: %d us\n", launch_mat_transpose<packedMatType>(SISD, Scale, Samples)); | |
std::vector<alignedMatType> SIMD; | |
std::printf("- SIMD: %d us\n", launch_mat_transpose<alignedMatType>(SIMD, Scale, Samples)); | |
for(std::size_t i = 0; i < Samples; ++i) | |
{ | |
packedMatType const A = SISD[i]; | |
packedMatType const B = SIMD[i]; | |
Error += glm::all(glm::equal(A, B, static_cast<T>(0.001))) ? 0 : 1; | |
assert(!Error); | |
} | |
return Error; | |
} | |
int main() | |
{ | |
std::size_t const Samples = 100000; | |
int Error = 0; | |
std::printf("glm::transpose(mat2):\n"); | |
Error += comp_mat2_transpose<glm::mat2, glm::aligned_mat2>(Samples); | |
std::printf("glm::transpose(dmat2):\n"); | |
Error += comp_mat2_transpose<glm::dmat2, glm::aligned_dmat2>(Samples); | |
std::printf("glm::transpose(mat3):\n"); | |
Error += comp_mat3_transpose<glm::mat3, glm::aligned_mat3>(Samples); | |
std::printf("glm::transpose(dmat3):\n"); | |
Error += comp_mat3_transpose<glm::dmat3, glm::aligned_dmat3>(Samples); | |
std::printf("glm::transpose(mat4):\n"); | |
Error += comp_mat4_transpose<glm::mat4, glm::aligned_mat4>(Samples); | |
std::printf("glm::transpose(dmat4):\n"); | |
Error += comp_mat4_transpose<glm::dmat4, glm::aligned_dmat4>(Samples); | |
return Error; | |
} | |
int main() | |
{ | |
return 0; | |
} | |