arm_bitreversal2.S 6.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228
  1. ;/* ----------------------------------------------------------------------
  2. ;* Copyright (C) 2010-2015 ARM Limited. All rights reserved.
  3. ;*
  4. ;* $Date: 21. December 2015
  5. ;* $Revision: V.1.4.5 a
  6. ;*
  7. ;* Project: CMSIS DSP Library
  8. ;* Title: arm_bitreversal2.S
  9. ;*
  10. ;* Description: This is the arm_bitreversal_32 function done in
  11. ;* assembly for maximum speed. This function is called
  12. ;* after doing an fft to reorder the output. The function
  13. ;* is loop unrolled by 2. arm_bitreversal_16 as well.
  14. ;*
  15. ;* Target Processor: Cortex-M4/Cortex-M3/Cortex-M0
  16. ;*
  17. ;* Redistribution and use in source and binary forms, with or without
  18. ;* modification, are permitted provided that the following conditions
  19. ;* are met:
  20. ;* - Redistributions of source code must retain the above copyright
  21. ;* notice, this list of conditions and the following disclaimer.
  22. ;* - Redistributions in binary form must reproduce the above copyright
  23. ;* notice, this list of conditions and the following disclaimer in
  24. ;* the documentation and/or other materials provided with the
  25. ;* distribution.
  26. ;* - Neither the name of ARM LIMITED nor the names of its contributors
  27. ;* may be used to endorse or promote products derived from this
  28. ;* software without specific prior written permission.
  29. ;*
  30. ;* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  31. ;* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  32. ;* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
  33. ;* FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
  34. ;* COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
  35. ;* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
  36. ;* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  37. ;* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  38. ;* CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  39. ;* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
  40. ;* ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  41. ;* POSSIBILITY OF SUCH DAMAGE.
  42. ;* -------------------------------------------------------------------- */
  ;/* Per-toolchain spellings of the directive words used in the code below. */
  ;/* Exactly one branch is selected by the predefined macro of the tool in use. */
#if defined ( __CC_ARM )                /* Keil */
    #define CODESECT AREA ||.text||, CODE, READONLY, ALIGN=2
    #define LABEL
#elif defined ( __IASMARM__ )           /* IAR */
    #define CODESECT SECTION `.text`:CODE
    #define PROC
    #define LABEL
    #define ENDP
    #define EXPORT PUBLIC
#elif defined ( __CSMC__ )              /* Cosmic */
    #define CODESECT switch .text
    #define THUMB
    #define EXPORT xdef
    #define PROC :
    #define LABEL :
    #define ENDP
    ;/* NOTE(review): only arm_bitreversal_32 is renamed with a leading underscore; */
    ;/* arm_bitreversal_16 keeps its plain name. Confirm whether it needs the same. */
    #define arm_bitreversal_32 _arm_bitreversal_32
#elif defined ( __TI_ARM__ )            /* TI ARM */
    #define THUMB .thumb
    #define CODESECT .text
    #define EXPORT .global
    #define PROC : .asmfunc
    #define LABEL :
    #define ENDP .endasmfunc
    #define END
#elif defined ( __GNUC__ )              /* GCC */
    #define THUMB .thumb
    #define CODESECT .section .text
    #define EXPORT .global
    #define PROC :
    #define LABEL :
    #define ENDP
    #define END
    .syntax unified
#endif

    ;/* Open the code section and select the Thumb instruction set. */
    CODESECT
    THUMB
  80. ;/*
  81. ;* @brief In-place bit reversal function.
  82. ;* @param[in, out] *pSrc points to the in-place buffer of unknown 32-bit data type.
  83. ;* @param[in] bitRevLen bit reversal table length
  84. ;* @param[in] *pBitRevTab points to bit reversal table.
  85. ;* @return none.
  86. ;*/
  ;/* Publish both entry points using the export directive of the active toolchain. */
    EXPORT arm_bitreversal_32
    EXPORT arm_bitreversal_16

    ;/* Only the GCC branch emits anything: it tags both symbols as functions. */
    ;/* The empty branches keep GCC from being selected when another tool matches. */
#if defined ( __CC_ARM )                /* Keil */
#elif defined ( __IASMARM__ )           /* IAR */
#elif defined ( __CSMC__ )              /* Cosmic */
#elif defined ( __TI_ARM__ )            /* TI ARM */
#elif defined ( __GNUC__ )              /* GCC */
    .type arm_bitreversal_16, %function
    .type arm_bitreversal_32, %function
#endif
  97. #if defined(ARM_MATH_CM0) || defined(ARM_MATH_CM0PLUS)
  ;/*
  ;* arm_bitreversal_32, build for ARM_MATH_CM0 and ARM_MATH_CM0PLUS.
  ;*
  ;* Registers on entry:
  ;*   r0 = pSrc        base address of the buffer reordered in place
  ;*   r1 = bitRevLen   number of 16-bit entries in the table
  ;*   r2 = pBitRevTab  address of the table
  ;*
  ;* Each pass reads two consecutive table entries, adds each to r0 as a
  ;* byte offset, and exchanges the two 32-bit words at the first address
  ;* with the two 32-bit words at the second address.
  ;* The pass count is (bitRevLen + 1) >> 1.
  ;*
  ;* The loop tests its counter only after the body has run, so a pass
  ;* count of zero must be rejected up front; otherwise the counter wraps
  ;* and the loop walks far outside the table and the buffer.
  ;*
  ;* r4-r6 are saved and restored. r1, r2, r3 and the flags are overwritten.
  ;*/
arm_bitreversal_32 PROC
        ADDS     r3,r1,#1
        LSRS     r3,r3,#1               ;/* r3 = pass count, Z set when it is zero */
        BEQ      arm_bitreversal_32_1   ;/* nothing to swap: return without touching memory */
        PUSH     {r4-r6}
        ADDS     r1,r2,#0               ;/* r1 = table cursor, frees r2 for use as scratch */
arm_bitreversal_32_0 LABEL
        LDRH     r2,[r1,#2]             ;/* second entry of the pair */
        LDRH     r6,[r1,#0]             ;/* first entry of the pair */
        ADD      r2,r0,r2               ;/* entries are byte offsets from pSrc */
        ADD      r6,r0,r6
        LDR      r5,[r2,#0]             ;/* exchange the first word */
        LDR      r4,[r6,#0]
        STR      r5,[r6,#0]
        STR      r4,[r2,#0]
        LDR      r5,[r2,#4]             ;/* exchange the following word */
        LDR      r4,[r6,#4]
        STR      r5,[r6,#4]
        STR      r4,[r2,#4]
        ADDS     r1,r1,#4               ;/* advance past the two entries just used */
        SUBS     r3,r3,#1
        BNE      arm_bitreversal_32_0
        POP      {r4-r6}
arm_bitreversal_32_1 LABEL
        BX       lr
        ENDP
  ;/*
  ;* arm_bitreversal_16, build for ARM_MATH_CM0 and ARM_MATH_CM0PLUS.
  ;*
  ;* Registers on entry:
  ;*   r0 = pSrc        base address of the buffer reordered in place
  ;*   r1 = bitRevLen   number of 16-bit entries in the table
  ;*   r2 = pBitRevTab  address of the table
  ;*
  ;* Each pass reads two consecutive table entries, halves each one, adds
  ;* it to r0 as a byte offset, and exchanges the single 32-bit word at the
  ;* first address with the 32-bit word at the second address.
  ;* The pass count is (bitRevLen + 1) >> 1.
  ;*
  ;* The loop tests its counter only after the body has run, so a pass
  ;* count of zero must be rejected up front; otherwise the counter wraps
  ;* and the loop walks far outside the table and the buffer.
  ;*
  ;* r4-r6 are saved and restored. r1, r2, r3 and the flags are overwritten.
  ;*/
arm_bitreversal_16 PROC
        ADDS     r3,r1,#1
        LSRS     r3,r3,#1               ;/* r3 = pass count, Z set when it is zero */
        BEQ      arm_bitreversal_16_1   ;/* nothing to swap: return without touching memory */
        PUSH     {r4-r6}
        ADDS     r1,r2,#0               ;/* r1 = table cursor, frees r2 for use as scratch */
arm_bitreversal_16_0 LABEL
        LDRH     r2,[r1,#2]             ;/* second entry of the pair */
        LDRH     r6,[r1,#0]             ;/* first entry of the pair */
        LSRS     r2,r2,#1               ;/* table value is halved to get the byte offset */
        LSRS     r6,r6,#1
        ADD      r2,r0,r2
        ADD      r6,r0,r6
        LDR      r5,[r2,#0]             ;/* exchange one 32-bit word */
        LDR      r4,[r6,#0]
        STR      r5,[r6,#0]
        STR      r4,[r2,#0]
        ADDS     r1,r1,#4               ;/* advance past the two entries just used */
        SUBS     r3,r3,#1
        BNE      arm_bitreversal_16_0
        POP      {r4-r6}
arm_bitreversal_16_1 LABEL
        BX       lr
        ENDP
  144. #else
  ;/*
  ;* arm_bitreversal_32, build used when neither ARM_MATH_CM0 nor
  ;* ARM_MATH_CM0PLUS is defined.
  ;*
  ;* Registers on entry:
  ;*   r0 = pSrc        base address of the buffer reordered in place
  ;*   r1 = bitRevLen   number of 16-bit entries in the table
  ;*   r2 = pBitRevTab  address of the table
  ;*
  ;* Each pass consumes four consecutive table entries, treated as two
  ;* pairs. Every entry is added to r0 as a byte offset, and for each pair
  ;* the two 32-bit words at one address are exchanged with the two 32-bit
  ;* words at the other. The pass count is (bitRevLen + 1) >> 2, so entries
  ;* left over after the last full group of four are not processed.
  ;*
  ;* The loop tests its counter only after the body has run, so the guard
  ;* is applied to the shifted pass count rather than to bitRevLen + 1.
  ;* That also covers bitRevLen values of 1 and 2, whose pass count is zero
  ;* and which would otherwise wrap the counter. Lengths that yield at
  ;* least one pass behave exactly as before.
  ;*
  ;* r4-r9 are saved and restored. r1, r2, r3, r12 and the flags are
  ;* overwritten.
  ;*/
arm_bitreversal_32 PROC
        ADDS     r3,r1,#1
        LSRS     r3,r3,#2               ;/* r3 = pass count, Z set when it is zero */
        IT       EQ
        BXEQ     lr                     ;/* nothing to swap: return before touching the stack */
        PUSH     {r4-r9}
        ADDS     r1,r2,#2               ;/* r1 = table cursor, biased by one entry */
arm_bitreversal_32_0 LABEL ;/* loop unrolled by 2 */
        LDRH     r8,[r1,#4]             ;/* fourth entry of the group */
        LDRH     r9,[r1,#2]             ;/* third entry */
        LDRH     r2,[r1,#0]             ;/* second entry */
        LDRH     r12,[r1,#-2]           ;/* first entry */
        ADD      r8,r0,r8               ;/* entries are byte offsets from pSrc */
        ADD      r9,r0,r9
        ADD      r2,r0,r2
        ADD      r12,r0,r12
        LDR      r7,[r9,#0]             ;/* first word of both pairs */
        LDR      r6,[r8,#0]
        LDR      r5,[r2,#0]
        LDR      r4,[r12,#0]
        STR      r6,[r9,#0]
        STR      r7,[r8,#0]
        STR      r5,[r12,#0]
        STR      r4,[r2,#0]
        LDR      r7,[r9,#4]             ;/* following word of both pairs */
        LDR      r6,[r8,#4]
        LDR      r5,[r2,#4]
        LDR      r4,[r12,#4]
        STR      r6,[r9,#4]
        STR      r7,[r8,#4]
        STR      r5,[r12,#4]
        STR      r4,[r2,#4]
        ADDS     r1,r1,#8               ;/* advance past the four entries just used */
        SUBS     r3,r3,#1
        BNE      arm_bitreversal_32_0
        POP      {r4-r9}
        BX       lr
        ENDP
  ;/*
  ;* arm_bitreversal_16, build used when neither ARM_MATH_CM0 nor
  ;* ARM_MATH_CM0PLUS is defined.
  ;*
  ;* Registers on entry:
  ;*   r0 = pSrc        base address of the buffer reordered in place
  ;*   r1 = bitRevLen   number of 16-bit entries in the table
  ;*   r2 = pBitRevTab  address of the table
  ;*
  ;* Each pass consumes four consecutive table entries, treated as two
  ;* pairs. Every entry is halved and added to r0 as a byte offset, and for
  ;* each pair the single 32-bit word at one address is exchanged with the
  ;* 32-bit word at the other. The pass count is (bitRevLen + 1) >> 2, so
  ;* entries left over after the last full group of four are not processed.
  ;*
  ;* The loop tests its counter only after the body has run, so the guard
  ;* is applied to the shifted pass count rather than to bitRevLen + 1.
  ;* That also covers bitRevLen values of 1 and 2, whose pass count is zero
  ;* and which would otherwise wrap the counter. Lengths that yield at
  ;* least one pass behave exactly as before.
  ;*
  ;* r4-r9 are saved and restored. r1, r2, r3, r12 and the flags are
  ;* overwritten.
  ;*/
arm_bitreversal_16 PROC
        ADDS     r3,r1,#1
        LSRS     r3,r3,#2               ;/* r3 = pass count, Z set when it is zero */
        IT       EQ
        BXEQ     lr                     ;/* nothing to swap: return before touching the stack */
        PUSH     {r4-r9}
        ADDS     r1,r2,#2               ;/* r1 = table cursor, biased by one entry */
arm_bitreversal_16_0 LABEL ;/* loop unrolled by 2 */
        LDRH     r8,[r1,#4]             ;/* fourth entry of the group */
        LDRH     r9,[r1,#2]             ;/* third entry */
        LDRH     r2,[r1,#0]             ;/* second entry */
        LDRH     r12,[r1,#-2]           ;/* first entry */
        ADD      r8,r0,r8,LSR #1        ;/* table value is halved to get the byte offset */
        ADD      r9,r0,r9,LSR #1
        ADD      r2,r0,r2,LSR #1
        ADD      r12,r0,r12,LSR #1
        LDR      r7,[r9,#0]             ;/* exchange one 32-bit word per pair */
        LDR      r6,[r8,#0]
        LDR      r5,[r2,#0]
        LDR      r4,[r12,#0]
        STR      r6,[r9,#0]
        STR      r7,[r8,#0]
        STR      r5,[r12,#0]
        STR      r4,[r2,#0]
        ADDS     r1,r1,#8               ;/* advance past the four entries just used */
        SUBS     r3,r3,#1
        BNE      arm_bitreversal_16_0
        POP      {r4-r9}
        BX       lr
        ENDP
  215. #endif
  216. END