genMVETwiddleCoefs.py 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456
  1. import numpy as np
  2. import math
  3. import argparse
  4. import sys
  5. sys.path.append("PatternGeneration")
  6. import Tools
  7. parser = argparse.ArgumentParser(description='Generate C arrays')
  8. parser.add_argument('-f', nargs='?',type = str, default="../Source/CommonTables/arm_mve_tables.c", help="C File path")
  9. parser.add_argument('-he', nargs='?',type = str, default="../Include/arm_mve_tables.h", help="H File path")
  10. args = parser.parse_args()
  11. COLLIM = 80
  12. condition="""#if !defined(ARM_DSP_CONFIG_TABLES) || defined(ARM_ALL_FFT_TABLES) || defined(ARM_TABLE_TWIDDLECOEF_%s_%d) || defined(ARM_TABLE_TWIDDLECOEF_%s_%d)
  13. """
  14. F32 = 1
  15. Q31 = 2
  16. Q15 = 3
  17. Q7 = 4
  18. def printCUInt32Array(f,name,arr):
  19. nb = 0
  20. print("uint32_t %s[%d]={" % (name,len(arr)),file=f)
  21. for d in arr:
  22. val = "%d," % d
  23. nb = nb + len(val)
  24. if nb > COLLIM:
  25. print("",file=f)
  26. nb = len(val)
  27. print(val,end="",file=f)
  28. print("};\n",file=f)
  29. def printCFloat32Array(f,name,arr):
  30. nb = 0
  31. print("float32_t %s[%d]={" % (name,len(arr)),file=f)
  32. for d in arr:
  33. val = "%.20ff," % d
  34. nb = nb + len(val)
  35. if nb > COLLIM:
  36. print("",file=f)
  37. nb = len(val)
  38. print(val,end="",file=f)
  39. print("};\n",file=f)
  40. def printCQ31Array(f,name,arr):
  41. nb = 0
  42. print("q31_t %s[%d]={" % (name,len(arr)),file=f)
  43. for d in arr:
  44. val = "%s," % Tools.to_q31(d)
  45. nb = nb + len(val)
  46. if nb > COLLIM:
  47. print("",file=f)
  48. nb = len(val)
  49. print(val,end="",file=f)
  50. print("};\n",file=f)
  51. def printCQ15Array(f,name,arr):
  52. nb = 0
  53. print("q15_t %s[%d]={" % (name,len(arr)),file=f)
  54. for d in arr:
  55. val = "%s," % Tools.to_q15(d)
  56. nb = nb + len(val)
  57. if nb > COLLIM:
  58. print("",file=f)
  59. nb = len(val)
  60. print(val,end="",file=f)
  61. print("};\n",file=f)
  62. def printCQ7Array(f,name,arr):
  63. nb = 0
  64. print("q7_t %s[%d]={" % (name,len(arr)),file=f)
  65. for d in arr:
  66. val = "%s," % Tools.to_q7(d)
  67. nb = nb + len(val)
  68. if nb > COLLIM:
  69. print("",file=f)
  70. nb = len(val)
  71. print(val,end="",file=f)
  72. print("};\n",file=f)
  73. def printHUInt32Array(f,name,arr):
  74. print("extern uint32_t %s[%d];" % (name,len(arr)),file=f)
  75. def printHFloat32Array(f,name,arr):
  76. print("extern float32_t %s[%d];" % (name,len(arr)),file=f)
  77. def printHQ31Array(f,name,arr):
  78. print("extern q31_t %s[%d];" % (name,len(arr)),file=f)
  79. def printHQ15Array(f,name,arr):
  80. print("extern q15_t %s[%d];" % (name,len(arr)),file=f)
  81. def printHQ7Array(f,name,arr):
  82. print("extern q7_t %s[%d];" % (name,len(arr)),file=f)
  83. def twiddle(n):
  84. a=2.0*math.pi*np.linspace(0,n,num=n,endpoint=False)/n
  85. c=np.cos(a)
  86. s=np.sin(a)
  87. r = np.empty((c.size + s.size,), dtype=c.dtype)
  88. r[0::2] = c
  89. r[1::2] = s
  90. return(r)
  91. def reorderTwiddle(theType,conjugate,f,h,n):
  92. numStages = 6
  93. coefs= twiddle(n)
  94. if n == 4096:
  95. numStages = 6
  96. arraySize = 1364
  97. if n == 1024:
  98. numStages = 5
  99. arraySize = 340
  100. if n == 256:
  101. numStages = 4
  102. arraySize = 84
  103. if n == 64:
  104. numStages = 3
  105. arraySize = 20
  106. if n == 16:
  107. numStages = 2
  108. arraySize = 4
  109. incr = 1
  110. nbOfElt = n
  111. maxNb = 0
  112. tab1 = np.zeros(2*arraySize)
  113. tab2 = np.zeros(2*arraySize)
  114. tab3 = np.zeros(2*arraySize)
  115. tab1Index=0
  116. tab2Index=0
  117. tab3Index=0
  118. tab1Offset = np.zeros(numStages)
  119. tab2Offset = np.zeros(numStages)
  120. tab3Offset = np.zeros(numStages)
  121. for stage in range(0,numStages-1):
  122. nbOfElt = nbOfElt >> 2
  123. pVectCoef1 = 0
  124. pVectCoef2 = 0
  125. pVectCoef3 = 0
  126. tab1Offset[stage] = tab1Index
  127. tab2Offset[stage] = tab2Index
  128. tab3Offset[stage] = tab3Index
  129. for i in range(0,nbOfElt):
  130. tab1[tab1Index] = coefs[pVectCoef1]
  131. if not conjugate:
  132. tab1[tab1Index + 1] = coefs[pVectCoef1 + 1]
  133. else:
  134. tab1[tab1Index + 1] = -coefs[pVectCoef1 + 1]
  135. tab1Index = tab1Index + 2
  136. pVectCoef1 = pVectCoef1 + (incr * 1 * 2)
  137. tab2[tab2Index] = coefs[pVectCoef2]
  138. if not conjugate:
  139. tab2[tab2Index + 1] = coefs[pVectCoef2 + 1]
  140. else:
  141. tab2[tab2Index + 1] = -coefs[pVectCoef2 + 1]
  142. tab2Index = tab2Index + 2
  143. pVectCoef2 = pVectCoef2 + (incr * 2 * 2)
  144. tab3[tab3Index] = coefs[pVectCoef3]
  145. if not conjugate:
  146. tab3[tab3Index + 1] = coefs[pVectCoef3 + 1]
  147. else:
  148. tab3[tab3Index + 1] = -coefs[pVectCoef3 + 1]
  149. tab3Index = tab3Index + 2
  150. pVectCoef3 = pVectCoef3 + (incr * 3 * 2)
  151. maxNb = maxNb + 1
  152. incr = 4 * incr
  153. # F32 SECTION FOR THIS FFT LENGTH
  154. if theType == F32:
  155. print(condition % ("F32",n, "F32",n << 1),file=f)
  156. print(condition % ("F32",n, "F32",n << 1),file=h)
  157. printCUInt32Array(f,"rearranged_twiddle_tab_stride1_arr_%d_f32" % n,list(tab1Offset))
  158. printHUInt32Array(h,"rearranged_twiddle_tab_stride1_arr_%d_f32" % n,list(tab1Offset))
  159. printCUInt32Array(f,"rearranged_twiddle_tab_stride2_arr_%d_f32" % n,list(tab2Offset))
  160. printHUInt32Array(h,"rearranged_twiddle_tab_stride2_arr_%d_f32" % n,list(tab2Offset))
  161. printCUInt32Array(f,"rearranged_twiddle_tab_stride3_arr_%d_f32" % n,list(tab3Offset))
  162. printHUInt32Array(h,"rearranged_twiddle_tab_stride3_arr_%d_f32" % n,list(tab3Offset))
  163. printCFloat32Array(f,"rearranged_twiddle_stride1_%d_f32" % n,list(tab1))
  164. printHFloat32Array(h,"rearranged_twiddle_stride1_%d_f32" % n,list(tab1))
  165. printCFloat32Array(f,"rearranged_twiddle_stride2_%d_f32" % n,list(tab2))
  166. printHFloat32Array(h,"rearranged_twiddle_stride2_%d_f32" % n,list(tab2))
  167. printCFloat32Array(f,"rearranged_twiddle_stride3_%d_f32" % n,list(tab3))
  168. printHFloat32Array(h,"rearranged_twiddle_stride3_%d_f32" % n,list(tab3))
  169. print("#endif\n",file=f)
  170. print("#endif\n",file=h)
  171. # Q31 SECTION FOR THIS FFT LENGTH
  172. if theType == Q31:
  173. print(condition % ("Q31",n, "Q31",n << 1),file=f)
  174. print(condition % ("Q31",n, "Q31",n << 1),file=h)
  175. printCUInt32Array(f,"rearranged_twiddle_tab_stride1_arr_%d_q31" % n,list(tab1Offset))
  176. printHUInt32Array(h,"rearranged_twiddle_tab_stride1_arr_%d_q31" % n,list(tab1Offset))
  177. printCUInt32Array(f,"rearranged_twiddle_tab_stride2_arr_%d_q31" % n,list(tab2Offset))
  178. printHUInt32Array(h,"rearranged_twiddle_tab_stride2_arr_%d_q31" % n,list(tab2Offset))
  179. printCUInt32Array(f,"rearranged_twiddle_tab_stride3_arr_%d_q31" % n,list(tab3Offset))
  180. printHUInt32Array(h,"rearranged_twiddle_tab_stride3_arr_%d_q31" % n,list(tab3Offset))
  181. printCQ31Array(f,"rearranged_twiddle_stride1_%d_q31" % n,list(tab1))
  182. printHQ31Array(h,"rearranged_twiddle_stride1_%d_q31" % n,list(tab1))
  183. printCQ31Array(f,"rearranged_twiddle_stride2_%d_q31" % n,list(tab2))
  184. printHQ31Array(h,"rearranged_twiddle_stride2_%d_q31" % n,list(tab2))
  185. printCQ31Array(f,"rearranged_twiddle_stride3_%d_q31" % n,list(tab3))
  186. printHQ31Array(h,"rearranged_twiddle_stride3_%d_q31" % n,list(tab3))
  187. print("#endif\n",file=f)
  188. print("#endif\n",file=h)
  189. # Q15 SECTION FOR THIS FFT LENGTH
  190. if theType == Q15:
  191. print(condition % ("Q15",n, "Q15",n << 1),file=f)
  192. print(condition % ("Q15",n, "Q15",n << 1),file=h)
  193. printCUInt32Array(f,"rearranged_twiddle_tab_stride1_arr_%d_q15" % n,list(tab1Offset))
  194. printHUInt32Array(h,"rearranged_twiddle_tab_stride1_arr_%d_q15" % n,list(tab1Offset))
  195. printCUInt32Array(f,"rearranged_twiddle_tab_stride2_arr_%d_q15" % n,list(tab2Offset))
  196. printHUInt32Array(h,"rearranged_twiddle_tab_stride2_arr_%d_q15" % n,list(tab2Offset))
  197. printCUInt32Array(f,"rearranged_twiddle_tab_stride3_arr_%d_q15" % n,list(tab3Offset))
  198. printHUInt32Array(h,"rearranged_twiddle_tab_stride3_arr_%d_q15" % n,list(tab3Offset))
  199. printCQ15Array(f,"rearranged_twiddle_stride1_%d_q15" % n,list(tab1))
  200. printHQ15Array(h,"rearranged_twiddle_stride1_%d_q15" % n,list(tab1))
  201. printCQ15Array(f,"rearranged_twiddle_stride2_%d_q15" % n,list(tab2))
  202. printHQ15Array(h,"rearranged_twiddle_stride2_%d_q15" % n,list(tab2))
  203. printCQ15Array(f,"rearranged_twiddle_stride3_%d_q15" % n,list(tab3))
  204. printHQ15Array(h,"rearranged_twiddle_stride3_%d_q15" % n,list(tab3))
  205. print("#endif\n",file=f)
  206. print("#endif\n",file=h)
  207. #test = twiddle(16)
  208. #printCFloat32Array("Test",list(test))
  209. cheader="""/* ----------------------------------------------------------------------
  210. * Project: CMSIS DSP Library
  211. * Title: arm_mve_tables.c
  212. * Description: common tables like fft twiddle factors, Bitreverse, reciprocal etc
  213. * used for MVE implementation only
  214. *
  215. * $Date: 08. January 2020
  216. * $Revision: V1.7.0
  217. *
  218. * Target Processor: Cortex-M cores
  219. * -------------------------------------------------------------------- */
  220. /*
  221. * Copyright (C) 2010-2020 ARM Limited or its affiliates. All rights reserved.
  222. *
  223. * SPDX-License-Identifier: Apache-2.0
  224. *
  225. * Licensed under the Apache License, Version 2.0 (the License); you may
  226. * not use this file except in compliance with the License.
  227. * You may obtain a copy of the License at
  228. *
  229. * www.apache.org/licenses/LICENSE-2.0
  230. *
  231. * Unless required by applicable law or agreed to in writing, software
  232. * distributed under the License is distributed on an AS IS BASIS, WITHOUT
  233. * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  234. * See the License for the specific language governing permissions and
  235. * limitations under the License.
  236. */
  237. """
  238. cifdeMVEF="""#include "arm_math.h"
  239. #if defined(ARM_MATH_MVEF) && !defined(ARM_MATH_AUTOVECTORIZE)
  240. #if !defined(ARM_DSP_CONFIG_TABLES) || defined(ARM_FFT_ALLOW_TABLES)
  241. """
  242. cfooterMVEF="""
  243. #endif /* !defined(ARM_DSP_CONFIG_TABLES) || defined(ARM_FFT_ALLOW_TABLES) */
  244. #endif /* defined(ARM_MATH_MVEF) && !defined(ARM_MATH_AUTOVECTORIZE) */
  245. """
  246. cifdeMVEI="""#include "arm_math.h"
  247. #if defined(ARM_MATH_MVEI)
  248. #if !defined(ARM_DSP_CONFIG_TABLES) || defined(ARM_FFT_ALLOW_TABLES)
  249. """
  250. cfooterMVEI="""
  251. #endif /* !defined(ARM_DSP_CONFIG_TABLES) || defined(ARM_FFT_ALLOW_TABLES) */
  252. #endif /* defined(ARM_MATH_MVEI) */
  253. """
  254. hheader="""/* ----------------------------------------------------------------------
  255. * Project: CMSIS DSP Library
  256. * Title: arm_mve_tables.h
  257. * Description: common tables like fft twiddle factors, Bitreverse, reciprocal etc
  258. * used for MVE implementation only
  259. *
  260. * $Date: 08. January 2020
  261. * $Revision: V1.7.0
  262. *
  263. * Target Processor: Cortex-M cores
  264. * -------------------------------------------------------------------- */
  265. /*
  266. * Copyright (C) 2010-2020 ARM Limited or its affiliates. All rights reserved.
  267. *
  268. * SPDX-License-Identifier: Apache-2.0
  269. *
  270. * Licensed under the Apache License, Version 2.0 (the License); you may
  271. * not use this file except in compliance with the License.
  272. * You may obtain a copy of the License at
  273. *
  274. * www.apache.org/licenses/LICENSE-2.0
  275. *
  276. * Unless required by applicable law or agreed to in writing, software
  277. * distributed under the License is distributed on an AS IS BASIS, WITHOUT
  278. * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  279. * See the License for the specific language governing permissions and
  280. * limitations under the License.
  281. */
  282. #ifndef _ARM_MVE_TABLES_H
  283. #define _ARM_MVE_TABLES_H
  284. #include "arm_math.h"
  285. """
  286. hifdefMVEF="""
  287. #if defined(ARM_MATH_MVEF) && !defined(ARM_MATH_AUTOVECTORIZE)
  288. #if !defined(ARM_DSP_CONFIG_TABLES) || defined(ARM_FFT_ALLOW_TABLES)
  289. """
  290. hfooterMVEF="""
  291. #endif /* !defined(ARM_DSP_CONFIG_TABLES) || defined(ARM_FFT_ALLOW_TABLES) */
  292. #endif /* defined(ARM_MATH_MVEF) && !defined(ARM_MATH_AUTOVECTORIZE) */
  293. """
  294. hifdefMVEI="""
  295. #if defined(ARM_MATH_MVEI)
  296. #if !defined(ARM_DSP_CONFIG_TABLES) || defined(ARM_FFT_ALLOW_TABLES)
  297. """
  298. hfooterMVEI="""
  299. #endif /* !defined(ARM_DSP_CONFIG_TABLES) || defined(ARM_FFT_ALLOW_TABLES) */
  300. #endif /* defined(ARM_MATH_MVEI) */
  301. """
  302. hfooter="""
  303. #endif /*_ARM_MVE_TABLES_H*/
  304. """
  305. with open(args.f,'w') as f:
  306. with open(args.he,'w') as h:
  307. print(cheader,file=f)
  308. print(hheader,file=h)
  309. print(cifdeMVEF,file=f)
  310. print(hifdefMVEF,file=h)
  311. reorderTwiddle(F32,False,f,h,16)
  312. reorderTwiddle(F32,False,f,h,64)
  313. reorderTwiddle(F32,False,f,h,256)
  314. reorderTwiddle(F32,False,f,h,1024)
  315. reorderTwiddle(F32,False,f,h,4096)
  316. print(cfooterMVEF,file=f)
  317. print(hfooterMVEF,file=h)
  318. print(cifdeMVEI,file=f)
  319. print(hifdefMVEI,file=h)
  320. reorderTwiddle(Q31,True,f,h,16)
  321. reorderTwiddle(Q31,True,f,h,64)
  322. reorderTwiddle(Q31,True,f,h,256)
  323. reorderTwiddle(Q31,True,f,h,1024)
  324. reorderTwiddle(Q31,True,f,h,4096)
  325. print(cfooterMVEI,file=f)
  326. print(hfooterMVEI,file=h)
  327. print(cifdeMVEI,file=f)
  328. print(hifdefMVEI,file=h)
  329. reorderTwiddle(Q15,True,f,h,16)
  330. reorderTwiddle(Q15,True,f,h,64)
  331. reorderTwiddle(Q15,True,f,h,256)
  332. reorderTwiddle(Q15,True,f,h,1024)
  333. reorderTwiddle(Q15,True,f,h,4096)
  334. print(cfooterMVEI,file=f)
  335. print(hfooterMVEI,file=h)
  336. print(cifdeMVEI,file=f)
  337. print(hifdefMVEI,file=h)
  338. reorderTwiddle(Q7,True,f,h,16)
  339. reorderTwiddle(Q7,True,f,h,64)
  340. reorderTwiddle(Q7,True,f,h,256)
  341. reorderTwiddle(Q7,True,f,h,1024)
  342. reorderTwiddle(Q7,True,f,h,4096)
  343. print(cfooterMVEI,file=f)
  344. print(hfooterMVEI,file=h)
  345. print(hfooter,file=h)