A bundled STM32F10x Std Periph and CMSIS library
Vous ne pouvez pas sélectionner plus de 25 sujets Les noms de sujets doivent commencer par une lettre ou un nombre, peuvent contenir des tirets ('-') et peuvent comporter jusqu'à 35 caractères.
 
 
 
 
 

163 lignes
5.2 KiB

  1. /* ----------------------------------------------------------------------
  2. * Copyright (C) 2010-2014 ARM Limited. All rights reserved.
  3. *
  4. * $Date: 12. March 2014
  5. * $Revision: V1.4.4
  6. *
  7. * Project: CMSIS DSP Library
  8. * Title: arm_scale_q15.c
  9. *
  10. * Description: Multiplies a Q15 vector by a scalar.
  11. *
  12. * Target Processor: Cortex-M4/Cortex-M3/Cortex-M0
  13. *
  14. * Redistribution and use in source and binary forms, with or without
  15. * modification, are permitted provided that the following conditions
  16. * are met:
  17. * - Redistributions of source code must retain the above copyright
  18. * notice, this list of conditions and the following disclaimer.
  19. * - Redistributions in binary form must reproduce the above copyright
  20. * notice, this list of conditions and the following disclaimer in
  21. * the documentation and/or other materials provided with the
  22. * distribution.
  23. * - Neither the name of ARM LIMITED nor the names of its contributors
  24. * may be used to endorse or promote products derived from this
  25. * software without specific prior written permission.
  26. *
  27. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  28. * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  29. * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
  30. * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
  31. * COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
  32. * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
  33. * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  34. * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  35. * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  36. * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
  37. * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  38. * POSSIBILITY OF SUCH DAMAGE.
  39. * -------------------------------------------------------------------- */
  40. #include "arm_math.h"
  41. /**
  42. * @ingroup groupMath
  43. */
  44. /**
  45. * @addtogroup scale
  46. * @{
  47. */
  48. /**
  49. * @brief Multiplies a Q15 vector by a scalar.
  50. * @param[in] *pSrc points to the input vector
  51. * @param[in] scaleFract fractional portion of the scale value
  52. * @param[in] shift number of bits to shift the result by
  53. * @param[out] *pDst points to the output vector
  54. * @param[in] blockSize number of samples in the vector
  55. * @return none.
  56. *
  57. * <b>Scaling and Overflow Behavior:</b>
  58. * \par
  59. * The input data <code>*pSrc</code> and <code>scaleFract</code> are in 1.15 format.
  60. * These are multiplied to yield a 2.30 intermediate result and this is shifted with saturation to 1.15 format.
  61. */
  62. void arm_scale_q15(
  63. q15_t * pSrc,
  64. q15_t scaleFract,
  65. int8_t shift,
  66. q15_t * pDst,
  67. uint32_t blockSize)
  68. {
  69. int8_t kShift = 15 - shift; /* shift to apply after scaling */
  70. uint32_t blkCnt; /* loop counter */
  71. #ifndef ARM_MATH_CM0_FAMILY
  72. /* Run the below code for Cortex-M4 and Cortex-M3 */
  73. q15_t in1, in2, in3, in4;
  74. q31_t inA1, inA2; /* Temporary variables */
  75. q31_t out1, out2, out3, out4;
  76. /*loop Unrolling */
  77. blkCnt = blockSize >> 2u;
  78. /* First part of the processing with loop unrolling. Compute 4 outputs at a time.
  79. ** a second loop below computes the remaining 1 to 3 samples. */
  80. while(blkCnt > 0u)
  81. {
  82. /* Reading 2 inputs from memory */
  83. inA1 = *__SIMD32(pSrc)++;
  84. inA2 = *__SIMD32(pSrc)++;
  85. /* C = A * scale */
  86. /* Scale the inputs and then store the 2 results in the destination buffer
  87. * in single cycle by packing the outputs */
  88. out1 = (q31_t) ((q15_t) (inA1 >> 16) * scaleFract);
  89. out2 = (q31_t) ((q15_t) inA1 * scaleFract);
  90. out3 = (q31_t) ((q15_t) (inA2 >> 16) * scaleFract);
  91. out4 = (q31_t) ((q15_t) inA2 * scaleFract);
  92. /* apply shifting */
  93. out1 = out1 >> kShift;
  94. out2 = out2 >> kShift;
  95. out3 = out3 >> kShift;
  96. out4 = out4 >> kShift;
  97. /* saturate the output */
  98. in1 = (q15_t) (__SSAT(out1, 16));
  99. in2 = (q15_t) (__SSAT(out2, 16));
  100. in3 = (q15_t) (__SSAT(out3, 16));
  101. in4 = (q15_t) (__SSAT(out4, 16));
  102. /* store the result to destination */
  103. *__SIMD32(pDst)++ = __PKHBT(in2, in1, 16);
  104. *__SIMD32(pDst)++ = __PKHBT(in4, in3, 16);
  105. /* Decrement the loop counter */
  106. blkCnt--;
  107. }
  108. /* If the blockSize is not a multiple of 4, compute any remaining output samples here.
  109. ** No loop unrolling is used. */
  110. blkCnt = blockSize % 0x4u;
  111. while(blkCnt > 0u)
  112. {
  113. /* C = A * scale */
  114. /* Scale the input and then store the result in the destination buffer. */
  115. *pDst++ = (q15_t) (__SSAT(((*pSrc++) * scaleFract) >> kShift, 16));
  116. /* Decrement the loop counter */
  117. blkCnt--;
  118. }
  119. #else
  120. /* Run the below code for Cortex-M0 */
  121. /* Initialize blkCnt with number of samples */
  122. blkCnt = blockSize;
  123. while(blkCnt > 0u)
  124. {
  125. /* C = A * scale */
  126. /* Scale the input and then store the result in the destination buffer. */
  127. *pDst++ = (q15_t) (__SSAT(((q31_t) * pSrc++ * scaleFract) >> kShift, 16));
  128. /* Decrement the loop counter */
  129. blkCnt--;
  130. }
  131. #endif /* #ifndef ARM_MATH_CM0_FAMILY */
  132. }
  133. /**
  134. * @} end of scale group
  135. */