diff options
Diffstat (limited to 'third_party/intgemm/test/kernels/add_bias_test.cc')
-rw-r--r-- | third_party/intgemm/test/kernels/add_bias_test.cc | 66 |
1 files changed, 66 insertions, 0 deletions
diff --git a/third_party/intgemm/test/kernels/add_bias_test.cc b/third_party/intgemm/test/kernels/add_bias_test.cc new file mode 100644 index 0000000000..b9e5fd95f5 --- /dev/null +++ b/third_party/intgemm/test/kernels/add_bias_test.cc @@ -0,0 +1,66 @@ +#include "../test.h" +#include "../../intgemm/aligned.h" +#include "../../intgemm/kernels.h" + +#include <numeric> + +namespace intgemm { + +template <CPUType CPUType_, typename ElemType_> +void kernel_add_bias_test() { + if (kCPU < CPUType_) + return; + + using vec_t = vector_t<CPUType_, ElemType_>; + constexpr static auto VECTOR_LENGTH = sizeof(vec_t) / sizeof(ElemType_); + + AlignedVector<ElemType_> input(VECTOR_LENGTH); + AlignedVector<ElemType_> bias(VECTOR_LENGTH); + AlignedVector<ElemType_> output(VECTOR_LENGTH); + + std::iota(input.begin(), input.end(), static_cast<ElemType_>(0)); + std::fill(bias.begin(), bias.end(), static_cast<ElemType_>(100)); + + *output.template as<vec_t>() = kernels::add_bias(*input.template as<vec_t>(), bias.begin(), 0); + for (std::size_t i = 0; i < output.size(); ++i) + CHECK(output[i] == ElemType_(100 + i)); +} + +template INTGEMM_SSE2 void kernel_add_bias_test<CPUType::SSE2, int8_t>(); +template INTGEMM_SSE2 void kernel_add_bias_test<CPUType::SSE2, int16_t>(); +template INTGEMM_SSE2 void kernel_add_bias_test<CPUType::SSE2, int>(); +template INTGEMM_SSE2 void kernel_add_bias_test<CPUType::SSE2, float>(); +template INTGEMM_SSE2 void kernel_add_bias_test<CPUType::SSE2, double>(); +KERNEL_TEST_CASE("add_bias/int8 SSE2") { return kernel_add_bias_test<CPUType::SSE2, int8_t>(); } +KERNEL_TEST_CASE("add_bias/int16 SSE2") { return kernel_add_bias_test<CPUType::SSE2, int16_t>(); } +KERNEL_TEST_CASE("add_bias/int SSE2") { return kernel_add_bias_test<CPUType::SSE2, int>(); } +KERNEL_TEST_CASE("add_bias/float SSE2") { return kernel_add_bias_test<CPUType::SSE2, float>(); } +KERNEL_TEST_CASE("add_bias/double SSE2") { return kernel_add_bias_test<CPUType::SSE2, double>(); } + +#ifdef INTGEMM_COMPILER_SUPPORTS_AVX2 +template INTGEMM_AVX2 void kernel_add_bias_test<CPUType::AVX2, int8_t>(); +template INTGEMM_AVX2 void kernel_add_bias_test<CPUType::AVX2, int16_t>(); +template INTGEMM_AVX2 void kernel_add_bias_test<CPUType::AVX2, int>(); +template INTGEMM_AVX2 void kernel_add_bias_test<CPUType::AVX2, float>(); +template INTGEMM_AVX2 void kernel_add_bias_test<CPUType::AVX2, double>(); +KERNEL_TEST_CASE("add_bias/int8 AVX2") { return kernel_add_bias_test<CPUType::AVX2, int8_t>(); } +KERNEL_TEST_CASE("add_bias/int16 AVX2") { return kernel_add_bias_test<CPUType::AVX2, int16_t>(); } +KERNEL_TEST_CASE("add_bias/int AVX2") { return kernel_add_bias_test<CPUType::AVX2, int>(); } +KERNEL_TEST_CASE("add_bias/float AVX2") { return kernel_add_bias_test<CPUType::AVX2, float>(); } +KERNEL_TEST_CASE("add_bias/double AVX2") { return kernel_add_bias_test<CPUType::AVX2, double>(); } +#endif + +#ifdef INTGEMM_COMPILER_SUPPORTS_AVX512BW +template INTGEMM_AVX512BW void kernel_add_bias_test<CPUType::AVX512BW, int8_t>(); +template INTGEMM_AVX512BW void kernel_add_bias_test<CPUType::AVX512BW, int16_t>(); +template INTGEMM_AVX512BW void kernel_add_bias_test<CPUType::AVX512BW, int>(); +template INTGEMM_AVX512BW void kernel_add_bias_test<CPUType::AVX512BW, float>(); +template INTGEMM_AVX512BW void kernel_add_bias_test<CPUType::AVX512BW, double>(); +KERNEL_TEST_CASE("add_bias/int8 AVX512BW") { return kernel_add_bias_test<CPUType::AVX512BW, int8_t>(); } +KERNEL_TEST_CASE("add_bias/int16 AVX512BW") { return kernel_add_bias_test<CPUType::AVX512BW, int16_t>(); } +KERNEL_TEST_CASE("add_bias/int AVX512BW") { return kernel_add_bias_test<CPUType::AVX512BW, int>(); } +KERNEL_TEST_CASE("add_bias/float AVX512BW") { return kernel_add_bias_test<CPUType::AVX512BW, float>(); } +KERNEL_TEST_CASE("add_bias/double AVX512BW") { return kernel_add_bias_test<CPUType::AVX512BW, double>(); } +#endif + +} |