1*4bdc9457SAndroid Build Coastguard Worker // Copyright 2022 Google LLC 2*4bdc9457SAndroid Build Coastguard Worker // 3*4bdc9457SAndroid Build Coastguard Worker // This source code is licensed under the BSD-style license found in the 4*4bdc9457SAndroid Build Coastguard Worker // LICENSE file in the root directory of this source tree. 5*4bdc9457SAndroid Build Coastguard Worker 6*4bdc9457SAndroid Build Coastguard Worker #include <assert.h> 7*4bdc9457SAndroid Build Coastguard Worker #include <stddef.h> 8*4bdc9457SAndroid Build Coastguard Worker #include <math.h> 9*4bdc9457SAndroid Build Coastguard Worker 10*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/common.h> 11*4bdc9457SAndroid Build Coastguard Worker #include <xnnpack/math-stubs.h> 12*4bdc9457SAndroid Build Coastguard Worker 13*4bdc9457SAndroid Build Coastguard Worker xnn_math_u32_sqrt__scalar_cvtu32_sqrtf_lrintf(size_t n,const uint32_t * input,uint32_t * output)14*4bdc9457SAndroid Build Coastguard Workervoid xnn_math_u32_sqrt__scalar_cvtu32_sqrtf_lrintf( 15*4bdc9457SAndroid Build Coastguard Worker size_t n, 16*4bdc9457SAndroid Build Coastguard Worker const uint32_t* input, 17*4bdc9457SAndroid Build Coastguard Worker uint32_t* output) 18*4bdc9457SAndroid Build Coastguard Worker { 19*4bdc9457SAndroid Build Coastguard Worker assert(n % sizeof(uint32_t) == 0); 20*4bdc9457SAndroid Build Coastguard Worker 21*4bdc9457SAndroid Build Coastguard Worker for (; n != 0; n -= sizeof(uint32_t)) { 22*4bdc9457SAndroid Build Coastguard Worker const uint32_t vx = *input++; 23*4bdc9457SAndroid Build Coastguard Worker 24*4bdc9457SAndroid Build Coastguard Worker uint32_t vy = vx; 25*4bdc9457SAndroid Build Coastguard Worker if XNN_LIKELY(vx != 0) { 26*4bdc9457SAndroid Build Coastguard Worker float vf = (float) vx; 27*4bdc9457SAndroid Build Coastguard Worker vf = sqrtf(vf); 28*4bdc9457SAndroid Build Coastguard Worker vy = (uint32_t) (int32_t) lrintf(vf); 29*4bdc9457SAndroid Build Coastguard Worker const uint32_t vsquared_y_less_x = vy * vy - vx; 30*4bdc9457SAndroid Build Coastguard Worker if XNN_UNPREDICTABLE((int32_t) (vsquared_y_less_x + vy) < 0) { 31*4bdc9457SAndroid Build Coastguard Worker vy += 1; 32*4bdc9457SAndroid Build Coastguard Worker } else if XNN_UNPREDICTABLE((int32_t) (vsquared_y_less_x - vy) >= 0) { 33*4bdc9457SAndroid Build Coastguard Worker vy -= 1; 34*4bdc9457SAndroid Build Coastguard Worker } 35*4bdc9457SAndroid Build Coastguard Worker } 36*4bdc9457SAndroid Build Coastguard Worker 37*4bdc9457SAndroid Build Coastguard Worker *output++ = vy; 38*4bdc9457SAndroid Build Coastguard Worker } 39*4bdc9457SAndroid Build Coastguard Worker } 40