#define GLM_FORCE_INLINE #include #include #include #if GLM_CONFIG_SIMD == GLM_ENABLE #include #include #include #include template static void test_mat_mul_vec(matType const& M, std::vector const& I, std::vector& O) { typedef typename vecType::value_type T; for (std::size_t i = 0, n = I.size(); i < n; ++i) O[i] = M * I[i]; } template static int launch_mat_mul_vec(std::size_t Samples) { typedef typename vecType::value_type T; static const matType Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16); { std::vector I(Samples); std::vector O(Samples); for(std::size_t i = 0; i < Samples; ++i) I[i] = vecType(static_cast(i)) * vecType(0.01, 0.02, 0.03, 0.05); std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now(); test_mat_mul_vec(Transform, I, O); std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now(); return static_cast(std::chrono::duration_cast(t2 - t1).count()); } } template static void test_vec_mul_mat(matType const& M, std::vector const& I, std::vector& O) { typedef typename vecType::value_type T; for (std::size_t i = 0, n = I.size(); i < n; ++i) O[i] = I[i] * M; } template static int launch_vec_mul_mat(std::size_t Samples) { typedef typename vecType::value_type T; static const matType Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16); std::vector I(Samples); std::vector O(Samples); for(std::size_t i = 0; i < Samples; ++i) I[i] = vecType(static_cast(i)) * vecType(0.01, 0.02, 0.03, 0.05); std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now(); test_mat_mul_vec(Transform, I, O); std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now(); return static_cast(std::chrono::duration_cast(t2 - t1).count()); } template static void test_mat_mul_mat(matType const& M, std::vector const& I, std::vector& O) { typedef typename matType::value_type T; for (std::size_t i = 0, n = I.size(); i < n; ++i) O[i] = M * I[i]; } template static int launch_mat_mul_mat(std::size_t Samples) { typedef typename matType::value_type T; static const matType Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16); { std::vector I(Samples); std::vector O(Samples); for(std::size_t i = 0; i < Samples; ++i) I[i] = matType(static_cast(i)) * matType(0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05); std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now(); test_mat_mul_mat(Transform, I, O); std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now(); return static_cast(std::chrono::duration_cast(t2 - t1).count()); } } template static void test_mat_div_mat(matType const& M, std::vector const& I, std::vector& O) { typedef typename matType::value_type T; for (std::size_t i = 0, n = I.size(); i < n; ++i) O[i] = M / I[i]; } template static int launch_mat_div_mat(std::size_t Samples) { typedef typename matType::value_type T; static const matType Transform(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16); { std::vector I(Samples); std::vector O(Samples); for(std::size_t i = 0; i < Samples; ++i) I[i] = matType(static_cast(i)) * matType(0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05, 0.01, 0.02, 0.03, 0.05); std::chrono::high_resolution_clock::time_point t1 = std::chrono::high_resolution_clock::now(); test_mat_div_mat(Transform, I, O); std::chrono::high_resolution_clock::time_point t2 = std::chrono::high_resolution_clock::now(); return static_cast(std::chrono::duration_cast(t2 - t1).count()); } } int main() { std::size_t const Samples = 50000; printf("\nmat4 * vec4\n"); printf("- dmat4 * dvec4 duration %d us\n", launch_mat_mul_vec(Samples)); printf("- dmat4 * dvec4 (SIMD) duration %d us\n", launch_mat_mul_vec(Samples)); printf("- mat4 * vec4 duration %d us\n", launch_mat_mul_vec(Samples)); printf("- mat4 * vec4 (SIMD) duration %d us\n", launch_mat_mul_vec(Samples)); printf("\nvec4 * mat4\n"); printf("- dvec4 * dmat4 duration %d us\n", launch_vec_mul_mat(Samples)); printf("- dvec4 * dmat4 (SIMD) duration %d us\n", launch_vec_mul_mat(Samples)); printf("- vec4 * mat4 duration %d us\n", launch_vec_mul_mat(Samples)); printf("- vec4 * mat4 (SIMD) duration %d us\n", launch_vec_mul_mat(Samples)); printf("\nmat4 * mat4\n"); printf("- dmat4 * dmat4 duration %d us\n", launch_mat_mul_mat(Samples)); printf("- dmat4 * dmat4 (SIMD) duration %d us\n", launch_mat_mul_mat(Samples)); printf("- mat4 * mat4 duration %d us\n", launch_mat_mul_mat(Samples)); printf("- mat4 * mat4 (SIMD) duration %d us\n", launch_mat_mul_mat(Samples)); printf("\nmat4 / mat4\n"); printf("- dmat4 / dmat4 duration %d us\n", launch_mat_div_mat(Samples)); printf("- dmat4 / dmat4 (SIMD) duration %d us\n", launch_mat_div_mat(Samples)); printf("- mat4 / mat4 duration %d us\n", launch_mat_div_mat(Samples)); printf("- mat4 / mat4 (SIMD) duration %d us\n", launch_mat_div_mat(Samples)); return 0; } #else int main() { return 0; } #endif