// Auto-generated file. Do not edit! // Template: src/cs16-vsquareabs/scalar.c.in // Generator: tools/xngen // // Copyright 2022 Google LLC // // This source code is licensed under the BSD-style license found in the // LICENSE file in the root directory of this source tree. #include #include #include #include #include void xnn_cs16_vsquareabs_ukernel__scalar_x2( size_t batch, const int16_t* input, uint32_t* output) { assert(batch != 0); assert(batch % (sizeof(int16_t) * 2) == 0); assert(input != NULL); assert(output != NULL); for (; batch >= 4 * sizeof(int16_t); batch -= 4 * sizeof(int16_t)) { const int32_t vr0 = (int32_t) input[0]; const int32_t vi0 = (int32_t) input[1]; const int32_t vr1 = (int32_t) input[2]; const int32_t vi1 = (int32_t) input[3]; input += 2 * 2; uint32_t vacc0 = (uint32_t) (vr0 * vr0); uint32_t vacc1 = (uint32_t) (vr1 * vr1); vacc0 += (uint32_t) (vi0 * vi0); vacc1 += (uint32_t) (vi1 * vi1); output[0] = vacc0; output[1] = vacc1; output += 2; } if XNN_LIKELY(batch != 0) { assert(batch == 2 * sizeof(int16_t)); const int32_t vr = (int32_t) input[0]; const int32_t vi = (int32_t) input[1]; uint32_t vacc = (uint32_t) (vr * vr); vacc += (uint32_t) (vi * vi); *output = vacc; } }