/* * Copyright (c) 2018 Vikrant More * * SPDX-License-Identifier: Apache-2.0 */ #include #include #include #include #include #define MAX_F_ITTERATIONS 6 /* usually converges in 4 loops */ /* this ensures we break out of the loop */ #define MAX_F_ERROR_COUNT 3 /* when result almost converges, stop */ #define EXP_MASK32 GENMASK(30, 23) float sqrtf(float square) { int i; float root; float last; int32_t exponent; int32_t *p_square = (int32_t *)□ int32_t *p_root = (int32_t *)&root; int32_t *p_last = (int32_t *)&last; if (square == 0.0f) { return square; } if (square < 0.0f) { return (square - square) / (square - square); } /* we need a good starting guess so that this will converge quickly, * we can do this by dividing the exponent part of the float by 2 * this assumes IEEE-754 format doubles */ exponent = ((*p_square & EXP_MASK32)>>23)-127; if (exponent == 0xFF-127) { /* the number is a NAN or inf, return NaN or inf */ return square + square; } exponent /= 2; *p_root = (*p_square & ~EXP_MASK32) | (exponent+127) << 23; for (i = 0; i < MAX_F_ITTERATIONS; i++) { last = root; root = (root + square / root) * 0.5f; /* if (labs(*p_root - *p_last) < MAX_F_ERROR_COUNT) */ if ((*p_root ^ *p_last) < MAX_F_ERROR_COUNT) { break; } } return root; }