// Auto-generated file. Do not edit! // Template: src/f32-vrsqrt/scalar-rsqrt.c.in // Generator: tools/xngen // // Copyright 2024 Google LLC // // This source code is licensed under the BSD-style license found in the // LICENSE file in the root directory of this source tree. #include #include #include "xnnpack/common.h" #include "xnnpack/vunary.h" void xnn_f32_vrsqrt_ukernel__scalar_rsqrt_u4( size_t batch, const float* input, float* output, const struct xnn_f32_default_params params[restrict XNN_MIN_ELEMENTS(1)]) { assert(batch != 0); assert(batch % sizeof(float) == 0); assert(input != NULL); assert(output != NULL); for (; batch >= 4 * sizeof(float); batch -= 4 * sizeof(float)) { const float vx0 = input[0]; const float vx1 = input[1]; const float vx2 = input[2]; const float vx3 = input[3]; input += 4; const float vt0 = sqrtf(vx0); const float vt1 = sqrtf(vx1); const float vt2 = sqrtf(vx2); const float vt3 = sqrtf(vx3); const float vy0 = 1.0f / vt0; const float vy1 = 1.0f / vt1; const float vy2 = 1.0f / vt2; const float vy3 = 1.0f / vt3; output[0] = vy0; output[1] = vy1; output[2] = vy2; output[3] = vy3; output += 4; } if XNN_UNLIKELY(batch != 0) { do { const float vx = *input++; const float vy = 1.0f / sqrtf(vx); *output++ = vy; batch -= sizeof(float); } while (batch != 0); } }