// Copyright 2023 Google LLC // // This source code is licensed under the BSD-style license found in the // LICENSE file in the root directory of this source tree. #ifndef XNN_UKERNEL_WITH_PARAMS #define XNN_UKERNEL_WITH_PARAMS(arch_flags, ukernel, batch_tile, vector_tile, datatype, params_type, init_params) \ XNN_UKERNEL(arch_flags, ukernel, batch_tile, vector_tile, datatype) #define XNN_DEFINED_UKERNEL_WITH_PARAMS #endif #ifndef XNN_UKERNEL #define XNN_UKERNEL(arch_flags, ukernel, batch_tile, vector_tile, datatype) \ XNN_UKERNEL_WITH_PARAMS(arch_flags, ukernel, batch_tile, vector_tile, datatype, void, /*init_params=*/nullptr) #define XNN_DEFINED_UKERNEL #endif #if XNN_ARCH_X86 || XNN_ARCH_X86_64 XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_f16c, xnn_f16_vtanh_ukernel__f16c_expm1minus_rr1_p3h2ts_div_u8, 8, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_f16c, xnn_f16_vtanh_ukernel__f16c_expm1minus_rr1_p3h2ts_div_u16, 16, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_f16c, xnn_f16_vtanh_ukernel__f16c_expm1minus_rr1_p3h2ts_div_u24, 24, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_f16c, xnn_f16_vtanh_ukernel__f16c_expm1minus_rr1_p3h2ts_div_u32, 32, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_f16c, xnn_f16_vtanh_ukernel__f16c_expm1minus_rr1_p3h2ts_rcp_u8, 8, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_f16c, xnn_f16_vtanh_ukernel__f16c_expm1minus_rr1_p3h2ts_rcp_u16, 16, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_f16c, xnn_f16_vtanh_ukernel__f16c_expm1minus_rr1_p3h2ts_rcp_u24, 24, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_f16c, xnn_f16_vtanh_ukernel__f16c_expm1minus_rr1_p3h2ts_rcp_u32, 32, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_f16c, xnn_f16_vtanh_ukernel__f16c_polynomial_p19h9t2_u8, 8, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_f16c, xnn_f16_vtanh_ukernel__f16c_polynomial_p19h9t2_u16, 16, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_f16c, xnn_f16_vtanh_ukernel__f16c_polynomial_p19h9t2_u24, 24, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_f16c, xnn_f16_vtanh_ukernel__f16c_polynomial_p19h9t2_u32, 32, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_fma3, xnn_f16_vtanh_ukernel__fma3_expm1minus_rr1_p3h2ts_div_u8, 8, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_fma3, xnn_f16_vtanh_ukernel__fma3_expm1minus_rr1_p3h2ts_div_u16, 16, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_fma3, xnn_f16_vtanh_ukernel__fma3_expm1minus_rr1_p3h2ts_div_u24, 24, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_fma3, xnn_f16_vtanh_ukernel__fma3_expm1minus_rr1_p3h2ts_div_u32, 32, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_fma3, xnn_f16_vtanh_ukernel__fma3_expm1minus_rr1_p3h2ts_rcp_u8, 8, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_fma3, xnn_f16_vtanh_ukernel__fma3_expm1minus_rr1_p3h2ts_rcp_u16, 16, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_fma3, xnn_f16_vtanh_ukernel__fma3_expm1minus_rr1_p3h2ts_rcp_u24, 24, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_fma3, xnn_f16_vtanh_ukernel__fma3_expm1minus_rr1_p3h2ts_rcp_u32, 32, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_fma3, xnn_f16_vtanh_ukernel__fma3_polynomial_p19h9t2_u8, 8, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_fma3, xnn_f16_vtanh_ukernel__fma3_polynomial_p19h9t2_u16, 16, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_fma3, xnn_f16_vtanh_ukernel__fma3_polynomial_p19h9t2_u24, 24, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_fma3, xnn_f16_vtanh_ukernel__fma3_polynomial_p19h9t2_u32, 32, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_avx2, xnn_f16_vtanh_ukernel__avx2_expm1minus_rr1_p3h2ts_div_u8, 8, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_avx2, xnn_f16_vtanh_ukernel__avx2_expm1minus_rr1_p3h2ts_div_u16, 16, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_avx2, xnn_f16_vtanh_ukernel__avx2_expm1minus_rr1_p3h2ts_div_u24, 24, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_avx2, xnn_f16_vtanh_ukernel__avx2_expm1minus_rr1_p3h2ts_div_u32, 32, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_avx2, xnn_f16_vtanh_ukernel__avx2_expm1minus_rr1_p3h2ts_rcp_u8, 8, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_avx2, xnn_f16_vtanh_ukernel__avx2_expm1minus_rr1_p3h2ts_rcp_u16, 16, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_avx2, xnn_f16_vtanh_ukernel__avx2_expm1minus_rr1_p3h2ts_rcp_u24, 24, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_x86_avx2, xnn_f16_vtanh_ukernel__avx2_expm1minus_rr1_p3h2ts_rcp_u32, 32, false, xnn_float16, struct xnn_f16_default_params, NULL) #endif // XNN_ARCH_X86 || XNN_ARCH_X86_64 #if XNN_ENABLE_ARM_FP16_VECTOR && (XNN_ARCH_ARM64) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__aarch64_neonfp16arith_expm1minus_rr1_p3h2ts_div_u8, 8, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__aarch64_neonfp16arith_expm1minus_rr1_p3h2ts_div_u16, 16, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__aarch64_neonfp16arith_expm1minus_rr1_p3h2ts_div_u24, 24, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__aarch64_neonfp16arith_expm1minus_rr1_p3h2ts_div_u32, 32, false, xnn_float16, struct xnn_f16_default_params, NULL) #endif // XNN_ENABLE_ARM_FP16_VECTOR && (XNN_ARCH_ARM64) #if XNN_ENABLE_ARM_FP16_VECTOR && (XNN_ARCH_ARM || XNN_ARCH_ARM64) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__neonfp16arith_expm1minus_rr1_p3h2ts_nr1fma_u8, 8, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__neonfp16arith_expm1minus_rr1_p3h2ts_nr1fma_u16, 16, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__neonfp16arith_expm1minus_rr1_p3h2ts_nr1fma_u24, 24, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__neonfp16arith_expm1minus_rr1_p3h2ts_nr1fma_u32, 32, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__neonfp16arith_expm1minus_rr1_p3h2ts_nr1recps_u8, 8, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__neonfp16arith_expm1minus_rr1_p3h2ts_nr1recps_u16, 16, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__neonfp16arith_expm1minus_rr1_p3h2ts_nr1recps_u24, 24, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__neonfp16arith_expm1minus_rr1_p3h2ts_nr1recps_u32, 32, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__neonfp16arith_expm1minus_rr1_p3h2ts_recpeadj_u8, 8, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__neonfp16arith_expm1minus_rr1_p3h2ts_recpeadj_u16, 16, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__neonfp16arith_expm1minus_rr1_p3h2ts_recpeadj_u24, 24, false, xnn_float16, struct xnn_f16_default_params, NULL) XNN_UKERNEL_WITH_PARAMS(xnn_arch_arm_neon_fp16_arith, xnn_f16_vtanh_ukernel__neonfp16arith_expm1minus_rr1_p3h2ts_recpeadj_u32, 32, false, xnn_float16, struct xnn_f16_default_params, NULL) #endif // XNN_ENABLE_ARM_FP16_VECTOR && (XNN_ARCH_ARM || XNN_ARCH_ARM64) #ifdef XNN_DEFINED_UKERNEL_WITH_PARAMS #undef XNN_DEFINED_UKERNEL_WITH_PARAMS #undef XNN_UKERNEL_WITH_PARAMS #endif #ifdef XNN_DEFINED_UKERNEL #undef XNN_DEFINED_UKERNEL #undef XNN_UKERNEL #endif