utils.h 5.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240
  1. /******************************************************************************
  2. * @file arm_math_utils.h
  3. * @brief Public header file for CMSIS DSP Library
  4. * @version V1.9.0
  5. * @date 20. July 2020
  6. ******************************************************************************/
  7. /*
  8. * Copyright (c) 2010-2020 Arm Limited or its affiliates. All rights reserved.
  9. *
  10. * SPDX-License-Identifier: Apache-2.0
  11. *
  12. * Licensed under the Apache License, Version 2.0 (the License); you may
  13. * not use this file except in compliance with the License.
  14. * You may obtain a copy of the License at
  15. *
  16. * www.apache.org/licenses/LICENSE-2.0
  17. *
  18. * Unless required by applicable law or agreed to in writing, software
  19. * distributed under the License is distributed on an AS IS BASIS, WITHOUT
  20. * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  21. * See the License for the specific language governing permissions and
  22. * limitations under the License.
  23. */
  24. #ifndef _ARM_MATH_UTILS_H_
  25. #define _ARM_MATH_UTILS_H_
  26. #include "arm_math_types.h"
  27. #ifdef __cplusplus
  28. extern "C"
  29. {
  30. #endif
  /**
   * @brief Helper macros; INDEX_MASK is required for the reciprocal
   *        calculation used by Normalized LMS.
   *
   * INDEX_MASK      keeps the low six bits of a value (table index 0..63).
   * SQ(v)           expands to v multiplied by itself.
   * CMSIS_ROUND_UP  rounds `value` up to a multiple of `step` using integer
   *                 division.
   *
   * SQ and CMSIS_ROUND_UP expand their arguments more than once, so do not
   * pass expressions that have side effects.
   */
  #define INDEX_MASK 0x3F
  #define SQ(v) ((v) * (v))
  #define CMSIS_ROUND_UP(value, step) ((((value) + (step) - 1) / (step)) * (step))
  37. /**
  38. * @brief Function to Calculates 1/in (reciprocal) value of Q31 Data type.
  39. */
  40. __STATIC_FORCEINLINE uint32_t arm_recip_q31(
  41. q31_t in,
  42. q31_t * dst,
  43. const q31_t * pRecipTable)
  44. {
  45. q31_t out;
  46. uint32_t tempVal;
  47. uint32_t index, i;
  48. uint32_t signBits;
  49. if (in > 0)
  50. {
  51. signBits = ((uint32_t) (__CLZ( in) - 1));
  52. }
  53. else
  54. {
  55. signBits = ((uint32_t) (__CLZ(-in) - 1));
  56. }
  57. /* Convert input sample to 1.31 format */
  58. in = (in << signBits);
  59. /* calculation of index for initial approximated Val */
  60. index = (uint32_t)(in >> 24);
  61. index = (index & INDEX_MASK);
  62. /* 1.31 with exp 1 */
  63. out = pRecipTable[index];
  64. /* calculation of reciprocal value */
  65. /* running approximation for two iterations */
  66. for (i = 0U; i < 2U; i++)
  67. {
  68. tempVal = (uint32_t) (((q63_t) in * out) >> 31);
  69. tempVal = 0x7FFFFFFFu - tempVal;
  70. /* 1.31 with exp 1 */
  71. /* out = (q31_t) (((q63_t) out * tempVal) >> 30); */
  72. out = clip_q63_to_q31(((q63_t) out * tempVal) >> 30);
  73. }
  74. /* write output */
  75. *dst = out;
  76. /* return num of signbits of out = 1/in value */
  77. return (signBits + 1U);
  78. }
  79. /**
  80. * @brief Function to Calculates 1/in (reciprocal) value of Q15 Data type.
  81. */
  82. __STATIC_FORCEINLINE uint32_t arm_recip_q15(
  83. q15_t in,
  84. q15_t * dst,
  85. const q15_t * pRecipTable)
  86. {
  87. q15_t out = 0;
  88. uint32_t tempVal = 0;
  89. uint32_t index = 0, i = 0;
  90. uint32_t signBits = 0;
  91. if (in > 0)
  92. {
  93. signBits = ((uint32_t)(__CLZ( in) - 17));
  94. }
  95. else
  96. {
  97. signBits = ((uint32_t)(__CLZ(-in) - 17));
  98. }
  99. /* Convert input sample to 1.15 format */
  100. in = (in << signBits);
  101. /* calculation of index for initial approximated Val */
  102. index = (uint32_t)(in >> 8);
  103. index = (index & INDEX_MASK);
  104. /* 1.15 with exp 1 */
  105. out = pRecipTable[index];
  106. /* calculation of reciprocal value */
  107. /* running approximation for two iterations */
  108. for (i = 0U; i < 2U; i++)
  109. {
  110. tempVal = (uint32_t) (((q31_t) in * out) >> 15);
  111. tempVal = 0x7FFFu - tempVal;
  112. /* 1.15 with exp 1 */
  113. out = (q15_t) (((q31_t) out * tempVal) >> 14);
  114. /* out = clip_q31_to_q15(((q31_t) out * tempVal) >> 14); */
  115. }
  116. /* write output */
  117. *dst = out;
  118. /* return num of signbits of out = 1/in value */
  119. return (signBits + 1);
  120. }
  121. /**
  122. * @brief 64-bit to 32-bit unsigned normalization
  123. * @param[in] in is input unsigned long long value
  124. * @param[out] normalized is the 32-bit normalized value
  125. * @param[out] norm is norm scale
  126. */
  127. __STATIC_INLINE void arm_norm_64_to_32u(uint64_t in, int32_t * normalized, int32_t *norm)
  128. {
  129. int32_t n1;
  130. int32_t hi = (int32_t) (in >> 32);
  131. int32_t lo = (int32_t) ((in << 32) >> 32);
  132. n1 = __CLZ(hi) - 32;
  133. if (!n1)
  134. {
  135. /*
  136. * input fits in 32-bit
  137. */
  138. n1 = __CLZ(lo);
  139. if (!n1)
  140. {
  141. /*
  142. * MSB set, need to scale down by 1
  143. */
  144. *norm = -1;
  145. *normalized = (((uint32_t) lo) >> 1);
  146. } else
  147. {
  148. if (n1 == 32)
  149. {
  150. /*
  151. * input is zero
  152. */
  153. *norm = 0;
  154. *normalized = 0;
  155. } else
  156. {
  157. /*
  158. * 32-bit normalization
  159. */
  160. *norm = n1 - 1;
  161. *normalized = lo << *norm;
  162. }
  163. }
  164. } else
  165. {
  166. /*
  167. * input fits in 64-bit
  168. */
  169. n1 = 1 - n1;
  170. *norm = -n1;
  171. /*
  172. * 64 bit normalization
  173. */
  174. *normalized = (((uint32_t) lo) >> n1) | (hi << (32 - n1));
  175. }
  176. }
  177. __STATIC_INLINE q31_t arm_div_q63_to_q31(q63_t num, q31_t den)
  178. {
  179. q31_t result;
  180. uint64_t absNum;
  181. int32_t normalized;
  182. int32_t norm;
  183. /*
  184. * if sum fits in 32bits
  185. * avoid costly 64-bit division
  186. */
  187. absNum = num > 0 ? num : -num;
  188. arm_norm_64_to_32u(absNum, &normalized, &norm);
  189. if (norm > 0)
  190. /*
  191. * 32-bit division
  192. */
  193. result = (q31_t) num / den;
  194. else
  195. /*
  196. * 64-bit division
  197. */
  198. result = (q31_t) (num / den);
  199. return result;
  200. }
  201. #ifdef __cplusplus
  202. }
  203. #endif
  204. #endif /*ifndef _ARM_MATH_UTILS_H_ */