xnnpack.patch 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742
  1. diff --git a/.bazelrc b/.bazelrc
  2. index ea28201..ffd4ed4 100644
  3. --- a/.bazelrc
  4. +++ b/.bazelrc
  5. @@ -44,3 +44,7 @@ build:ios_arm64e --watchos_cpus=armv7k
  6. build:ios_fat --config=ios
  7. build:ios_fat --ios_multi_cpus=armv7,arm64
  8. build:ios_fat --watchos_cpus=armv7k
  9. +
  10. +# WASM configs
  11. +build:emscripten_wasm --cpu=wasm
  12. +build:emscripten_wasm --crosstool_top=//toolchain:emscripten
  13. diff --git a/BUILD.bazel b/BUILD.bazel
  14. index d38ef1e..f261eb5 100644
  15. --- a/BUILD.bazel
  16. +++ b/BUILD.bazel
  17. @@ -3228,13 +3228,19 @@ xnnpack_cc_library(
  18. hdrs = INTERNAL_HDRS,
  19. gcc_copts = xnnpack_gcc_std_copts(),
  20. msvc_copts = xnnpack_msvc_std_copts(),
  21. - wasm_srcs = WASM_UKERNELS,
  22. - wasmsimd_srcs = WASM_UKERNELS + WASMSIMD_UKERNELS,
  23. + optimized_copts = [
  24. + "-ffast-math",
  25. + ],
  26. + wasm_srcs = WASM_UKERNELS + WASMSIMD_UKERNELS +
  27. + PSIMD_FASTMATH_UKERNELS + PSIMD_ACCMATH_UKERNELS,
  28. + wasmsimd_srcs = WASM_UKERNELS + WASMSIMD_UKERNELS +
  29. + PSIMD_FASTMATH_UKERNELS + PSIMD_ACCMATH_UKERNELS,
  30. deps = [
  31. ":tables",
  32. "@FP16",
  33. "@FXdiv",
  34. "@pthreadpool",
  35. + "@psimd",
  36. ],
  37. )
  38. @@ -3247,13 +3253,19 @@ xnnpack_cc_library(
  39. ],
  40. gcc_copts = xnnpack_gcc_std_copts(),
  41. msvc_copts = xnnpack_msvc_std_copts(),
  42. - wasm_srcs = WASM_UKERNELS,
  43. - wasmsimd_srcs = WASM_UKERNELS + WASMSIMD_UKERNELS,
  44. + optimized_copts = [
  45. + "-ffast-math",
  46. + ],
  47. + wasm_srcs = WASM_UKERNELS + WASMSIMD_UKERNELS +
  48. + PSIMD_FASTMATH_UKERNELS + PSIMD_ACCMATH_UKERNELS,
  49. + wasmsimd_srcs = WASM_UKERNELS + WASMSIMD_UKERNELS +
  50. + PSIMD_FASTMATH_UKERNELS + PSIMD_ACCMATH_UKERNELS,
  51. deps = [
  52. ":tables",
  53. "@FP16",
  54. "@FXdiv",
  55. "@pthreadpool",
  56. + "@psimd",
  57. ],
  58. )
  59. @@ -4495,7 +4507,7 @@ xnnpack_cc_library(
  60. ######################### Benchmarks for micro-kernels #########################
  61. xnnpack_benchmark(
  62. - name = "qs8_gemm_bench",
  63. + name = "qs8_gemm_bench.wasm",
  64. srcs = [
  65. "bench/gemm.h",
  66. "bench/qs8-gemm.cc",
  67. @@ -4506,7 +4518,7 @@ xnnpack_benchmark(
  68. )
  69. xnnpack_benchmark(
  70. - name = "qs8_requantization_bench",
  71. + name = "qs8_requantization_bench.wasm",
  72. srcs = [
  73. "bench/qs8-requantization.cc",
  74. "src/xnnpack/AlignedAllocator.h",
  75. @@ -4516,7 +4528,7 @@ xnnpack_benchmark(
  76. )
  77. xnnpack_benchmark(
  78. - name = "qu8_gemm_bench",
  79. + name = "qu8_gemm_bench.wasm",
  80. srcs = [
  81. "bench/gemm.h",
  82. "bench/qu8-gemm.cc",
  83. @@ -4527,7 +4539,7 @@ xnnpack_benchmark(
  84. )
  85. xnnpack_benchmark(
  86. - name = "qu8_requantization_bench",
  87. + name = "qu8_requantization_bench.wasm",
  88. srcs = [
  89. "bench/qu8-requantization.cc",
  90. "src/xnnpack/AlignedAllocator.h",
  91. @@ -4537,11 +4549,11 @@ xnnpack_benchmark(
  92. )
  93. xnnpack_benchmark(
  94. - name = "f16_igemm_bench",
  95. + name = "f16_igemm_bench.wasm",
  96. srcs = [
  97. "bench/f16-igemm.cc",
  98. "bench/conv.h",
  99. - "bench/google/conv.h",
  100. + #"bench/google/conv.h",
  101. "src/xnnpack/AlignedAllocator.h",
  102. ] + MICROKERNEL_BENCHMARK_HDRS,
  103. deps = MICROKERNEL_BENCHMARK_DEPS + [
  104. @@ -4551,7 +4563,7 @@ xnnpack_benchmark(
  105. )
  106. xnnpack_benchmark(
  107. - name = "f16_gemm_bench",
  108. + name = "f16_gemm_bench.wasm",
  109. srcs = [
  110. "bench/f16-gemm.cc",
  111. "bench/gemm.h",
  112. @@ -4563,7 +4575,7 @@ xnnpack_benchmark(
  113. )
  114. xnnpack_benchmark(
  115. - name = "f16_spmm_bench",
  116. + name = "f16_spmm_bench.wasm",
  117. srcs = [
  118. "bench/f16-spmm.cc",
  119. "bench/gemm.h",
  120. @@ -4573,7 +4585,7 @@ xnnpack_benchmark(
  121. )
  122. xnnpack_benchmark(
  123. - name = "f32_igemm_bench",
  124. + name = "f32_igemm_bench.wasm",
  125. srcs = [
  126. "bench/f32-igemm.cc",
  127. "bench/conv.h",
  128. @@ -4586,7 +4598,7 @@ xnnpack_benchmark(
  129. )
  130. xnnpack_benchmark(
  131. - name = "f16_relu_bench",
  132. + name = "f16_relu_bench.wasm",
  133. srcs = [
  134. "bench/f16-relu.cc",
  135. "src/xnnpack/AlignedAllocator.h",
  136. @@ -4595,7 +4607,7 @@ xnnpack_benchmark(
  137. )
  138. xnnpack_benchmark(
  139. - name = "f32_conv_hwc_bench",
  140. + name = "f32_conv_hwc_bench.wasm",
  141. srcs = [
  142. "bench/f32-conv-hwc.cc",
  143. "bench/dconv.h",
  144. @@ -4607,7 +4619,7 @@ xnnpack_benchmark(
  145. )
  146. xnnpack_benchmark(
  147. - name = "f32_conv_hwc2chw_bench",
  148. + name = "f32_conv_hwc2chw_bench.wasm",
  149. srcs = [
  150. "bench/f32-conv-hwc2chw.cc",
  151. "bench/dconv.h",
  152. @@ -4619,11 +4631,11 @@ xnnpack_benchmark(
  153. )
  154. xnnpack_benchmark(
  155. - name = "f16_dwconv_bench",
  156. + name = "f16_dwconv_bench.wasm",
  157. srcs = [
  158. "bench/f16-dwconv.cc",
  159. "bench/dwconv.h",
  160. - "bench/google/dwconv.h",
  161. + #"bench/google/dwconv.h",
  162. "src/xnnpack/AlignedAllocator.h",
  163. ] + MICROKERNEL_BENCHMARK_HDRS,
  164. deps = MICROKERNEL_BENCHMARK_DEPS + [
  165. @@ -4633,7 +4645,7 @@ xnnpack_benchmark(
  166. )
  167. xnnpack_benchmark(
  168. - name = "f32_dwconv_bench",
  169. + name = "f32_dwconv_bench.wasm",
  170. srcs = [
  171. "bench/f32-dwconv.cc",
  172. "bench/dwconv.h",
  173. @@ -4646,7 +4658,7 @@ xnnpack_benchmark(
  174. )
  175. xnnpack_benchmark(
  176. - name = "f32_dwconv2d_chw_bench",
  177. + name = "f32_dwconv2d_chw_bench.wasm",
  178. srcs = [
  179. "bench/f32-dwconv2d-chw.cc",
  180. "bench/dwconv.h",
  181. @@ -4659,7 +4671,7 @@ xnnpack_benchmark(
  182. )
  183. xnnpack_benchmark(
  184. - name = "f32_gemm_bench",
  185. + name = "f32_gemm_bench.wasm",
  186. srcs = [
  187. "bench/f32-gemm.cc",
  188. "bench/gemm.h",
  189. @@ -4670,7 +4682,7 @@ xnnpack_benchmark(
  190. )
  191. xnnpack_benchmark(
  192. - name = "f32_hswish_bench",
  193. + name = "f32_hswish_bench.wasm",
  194. srcs = [
  195. "bench/f32-hswish.cc",
  196. "src/xnnpack/AlignedAllocator.h",
  197. @@ -4679,7 +4691,7 @@ xnnpack_benchmark(
  198. )
  199. xnnpack_benchmark(
  200. - name = "f32_raddexpminusmax_bench",
  201. + name = "f32_raddexpminusmax_bench.wasm",
  202. srcs = [
  203. "bench/f32-raddexpminusmax.cc",
  204. "src/xnnpack/AlignedAllocator.h",
  205. @@ -4688,7 +4700,7 @@ xnnpack_benchmark(
  206. )
  207. xnnpack_benchmark(
  208. - name = "f32_raddextexp_bench",
  209. + name = "f32_raddextexp_bench.wasm",
  210. srcs = [
  211. "bench/f32-raddextexp.cc",
  212. "src/xnnpack/AlignedAllocator.h",
  213. @@ -4697,7 +4709,7 @@ xnnpack_benchmark(
  214. )
  215. xnnpack_benchmark(
  216. - name = "f32_raddstoreexpminusmax_bench",
  217. + name = "f32_raddstoreexpminusmax_bench.wasm",
  218. srcs = [
  219. "bench/f32-raddstoreexpminusmax.cc",
  220. "src/xnnpack/AlignedAllocator.h",
  221. @@ -4706,7 +4718,7 @@ xnnpack_benchmark(
  222. )
  223. xnnpack_benchmark(
  224. - name = "f32_relu_bench",
  225. + name = "f32_relu_bench.wasm",
  226. srcs = [
  227. "bench/f32-relu.cc",
  228. "src/xnnpack/AlignedAllocator.h",
  229. @@ -4715,7 +4727,7 @@ xnnpack_benchmark(
  230. )
  231. xnnpack_benchmark(
  232. - name = "f32_rmax_bench",
  233. + name = "f32_rmax_bench.wasm",
  234. srcs = [
  235. "bench/f32-rmax.cc",
  236. "src/xnnpack/AlignedAllocator.h",
  237. @@ -4724,7 +4736,7 @@ xnnpack_benchmark(
  238. )
  239. xnnpack_benchmark(
  240. - name = "f32_sigmoid_bench",
  241. + name = "f32_sigmoid_bench.wasm",
  242. srcs = [
  243. "bench/f32-sigmoid.cc",
  244. "src/xnnpack/AlignedAllocator.h",
  245. @@ -4733,7 +4745,7 @@ xnnpack_benchmark(
  246. )
  247. xnnpack_benchmark(
  248. - name = "f32_spmm_bench",
  249. + name = "f32_spmm_bench.wasm",
  250. srcs = [
  251. "bench/f32-spmm.cc",
  252. "bench/gemm.h",
  253. @@ -4743,7 +4755,7 @@ xnnpack_benchmark(
  254. )
  255. xnnpack_benchmark(
  256. - name = "f32_softmax_bench",
  257. + name = "f32_softmax_bench.wasm",
  258. srcs = [
  259. "bench/f32-softmax.cc",
  260. ] + MICROKERNEL_BENCHMARK_HDRS,
  261. @@ -4752,7 +4764,7 @@ xnnpack_benchmark(
  262. )
  263. xnnpack_benchmark(
  264. - name = "f32_vscaleexpminusmax_bench",
  265. + name = "f32_vscaleexpminusmax_bench.wasm",
  266. srcs = [
  267. "bench/f32-vscaleexpminusmax.cc",
  268. "src/xnnpack/AlignedAllocator.h",
  269. @@ -4761,7 +4773,7 @@ xnnpack_benchmark(
  270. )
  271. xnnpack_benchmark(
  272. - name = "f32_vscaleextexp_bench",
  273. + name = "f32_vscaleextexp_bench.wasm",
  274. srcs = [
  275. "bench/f32-vscaleextexp.cc",
  276. "src/xnnpack/AlignedAllocator.h",
  277. @@ -4770,7 +4782,7 @@ xnnpack_benchmark(
  278. )
  279. xnnpack_benchmark(
  280. - name = "f32_vsqrt_bench",
  281. + name = "f32_vsqrt_bench.wasm",
  282. srcs = [
  283. "bench/f32-vsqrt.cc",
  284. "src/xnnpack/AlignedAllocator.h",
  285. @@ -4779,7 +4791,7 @@ xnnpack_benchmark(
  286. )
  287. xnnpack_benchmark(
  288. - name = "f32_im2col_gemm_bench",
  289. + name = "f32_im2col_gemm_bench.wasm",
  290. srcs = [
  291. "bench/f32-im2col-gemm.cc",
  292. "bench/conv.h",
  293. @@ -4792,7 +4804,7 @@ xnnpack_benchmark(
  294. )
  295. xnnpack_benchmark(
  296. - name = "rounding_bench",
  297. + name = "rounding_bench.wasm",
  298. srcs = [
  299. "bench/rounding.cc",
  300. "src/xnnpack/AlignedAllocator.h",
  301. @@ -4804,7 +4816,7 @@ xnnpack_benchmark(
  302. ########################### Benchmarks for operators ###########################
  303. xnnpack_benchmark(
  304. - name = "average_pooling_bench",
  305. + name = "average_pooling_bench.wasm",
  306. srcs = ["bench/average-pooling.cc"],
  307. copts = xnnpack_optional_tflite_copts(),
  308. tags = ["nowin32"],
  309. @@ -4812,7 +4824,7 @@ xnnpack_benchmark(
  310. )
  311. xnnpack_benchmark(
  312. - name = "bankers_rounding_bench",
  313. + name = "bankers_rounding_bench.wasm",
  314. srcs = ["bench/bankers-rounding.cc"],
  315. copts = xnnpack_optional_tflite_copts(),
  316. tags = ["nowin32"],
  317. @@ -4820,7 +4832,7 @@ xnnpack_benchmark(
  318. )
  319. xnnpack_benchmark(
  320. - name = "ceiling_bench",
  321. + name = "ceiling_bench.wasm",
  322. srcs = ["bench/ceiling.cc"],
  323. copts = xnnpack_optional_tflite_copts(),
  324. tags = ["nowin32"],
  325. @@ -4828,13 +4840,13 @@ xnnpack_benchmark(
  326. )
  327. xnnpack_benchmark(
  328. - name = "channel_shuffle_bench",
  329. + name = "channel_shuffle_bench.wasm",
  330. srcs = ["bench/channel-shuffle.cc"],
  331. deps = OPERATOR_BENCHMARK_DEPS,
  332. )
  333. xnnpack_benchmark(
  334. - name = "convolution_bench",
  335. + name = "convolution_bench.wasm",
  336. srcs = ["bench/convolution.cc"],
  337. copts = xnnpack_optional_tflite_copts() + xnnpack_optional_armcl_copts(),
  338. tags = ["nowin32"],
  339. @@ -4842,7 +4854,7 @@ xnnpack_benchmark(
  340. )
  341. xnnpack_benchmark(
  342. - name = "deconvolution_bench",
  343. + name = "deconvolution_bench.wasm",
  344. srcs = ["bench/deconvolution.cc"],
  345. copts = xnnpack_optional_tflite_copts(),
  346. tags = ["nowin32"],
  347. @@ -4850,7 +4862,7 @@ xnnpack_benchmark(
  348. )
  349. xnnpack_benchmark(
  350. - name = "floor_bench",
  351. + name = "floor_bench.wasm",
  352. srcs = ["bench/floor.cc"],
  353. copts = xnnpack_optional_tflite_copts(),
  354. tags = ["nowin32"],
  355. @@ -4858,13 +4870,13 @@ xnnpack_benchmark(
  356. )
  357. xnnpack_benchmark(
  358. - name = "global_average_pooling_bench",
  359. + name = "global_average_pooling_bench.wasm",
  360. srcs = ["bench/global-average-pooling.cc"],
  361. deps = OPERATOR_BENCHMARK_DEPS,
  362. )
  363. xnnpack_benchmark(
  364. - name = "hardswish_bench",
  365. + name = "hardswish_bench.wasm",
  366. srcs = ["bench/hardswish.cc"],
  367. copts = xnnpack_optional_tflite_copts(),
  368. tags = ["nowin32"],
  369. @@ -4872,13 +4884,13 @@ xnnpack_benchmark(
  370. )
  371. xnnpack_benchmark(
  372. - name = "max_pooling_bench",
  373. + name = "max_pooling_bench.wasm",
  374. srcs = ["bench/max-pooling.cc"],
  375. deps = OPERATOR_BENCHMARK_DEPS,
  376. )
  377. xnnpack_benchmark(
  378. - name = "sigmoid_bench",
  379. + name = "sigmoid_bench.wasm",
  380. srcs = ["bench/sigmoid.cc"],
  381. copts = xnnpack_optional_tflite_copts(),
  382. tags = ["nowin32"],
  383. @@ -4886,7 +4898,7 @@ xnnpack_benchmark(
  384. )
  385. xnnpack_benchmark(
  386. - name = "prelu_bench",
  387. + name = "prelu_bench.wasm",
  388. srcs = ["bench/prelu.cc"],
  389. copts = xnnpack_optional_tflite_copts(),
  390. tags = ["nowin32"],
  391. @@ -4894,7 +4906,7 @@ xnnpack_benchmark(
  392. )
  393. xnnpack_benchmark(
  394. - name = "softmax_bench",
  395. + name = "softmax_bench.wasm",
  396. srcs = ["bench/softmax.cc"],
  397. copts = xnnpack_optional_tflite_copts(),
  398. tags = ["nowin32"],
  399. @@ -4902,7 +4914,7 @@ xnnpack_benchmark(
  400. )
  401. xnnpack_benchmark(
  402. - name = "square_root_bench",
  403. + name = "square_root_bench.wasm",
  404. srcs = ["bench/square-root.cc"],
  405. copts = xnnpack_optional_tflite_copts(),
  406. tags = ["nowin32"],
  407. @@ -4910,7 +4922,7 @@ xnnpack_benchmark(
  408. )
  409. xnnpack_benchmark(
  410. - name = "truncation_bench",
  411. + name = "truncation_bench.wasm",
  412. srcs = ["bench/truncation.cc"],
  413. deps = OPERATOR_BENCHMARK_DEPS,
  414. )
  415. @@ -4918,7 +4930,7 @@ xnnpack_benchmark(
  416. ############################# End-to-end benchmarks ############################
  417. cc_library(
  418. - name = "fp32_mobilenet_v1",
  419. + name = "fp32_mobilenet_v1.wasm",
  420. srcs = ["models/fp32-mobilenet-v1.cc"],
  421. hdrs = ["models/models.h"],
  422. copts = xnnpack_std_cxxopts(),
  423. @@ -4930,7 +4942,7 @@ cc_library(
  424. )
  425. cc_library(
  426. - name = "fp16_mobilenet_v1",
  427. + name = "fp16_mobilenet_v1.wasm",
  428. srcs = ["models/fp16-mobilenet-v1.cc"],
  429. hdrs = ["models/models.h"],
  430. copts = xnnpack_std_cxxopts(),
  431. @@ -4943,7 +4955,7 @@ cc_library(
  432. )
  433. cc_library(
  434. - name = "qs8_mobilenet_v1",
  435. + name = "qs8_mobilenet_v1.wasm",
  436. srcs = ["models/qs8-mobilenet-v1.cc"],
  437. hdrs = ["models/models.h"],
  438. copts = xnnpack_std_cxxopts(),
  439. @@ -4955,7 +4967,7 @@ cc_library(
  440. )
  441. cc_library(
  442. - name = "qs8_mobilenet_v2",
  443. + name = "qs8_mobilenet_v2.wasm",
  444. srcs = ["models/qs8-mobilenet-v2.cc"],
  445. hdrs = ["models/models.h"],
  446. copts = xnnpack_std_cxxopts(),
  447. @@ -4967,7 +4979,7 @@ cc_library(
  448. )
  449. cc_library(
  450. - name = "fp32_mobilenet_v2",
  451. + name = "fp32_mobilenet_v2.wasm",
  452. srcs = ["models/fp32-mobilenet-v2.cc"],
  453. hdrs = ["models/models.h"],
  454. copts = xnnpack_std_cxxopts(),
  455. @@ -4979,7 +4991,7 @@ cc_library(
  456. )
  457. cc_library(
  458. - name = "fp16_mobilenet_v2",
  459. + name = "fp16_mobilenet_v2.wasm",
  460. srcs = ["models/fp16-mobilenet-v2.cc"],
  461. hdrs = ["models/models.h"],
  462. copts = xnnpack_std_cxxopts(),
  463. @@ -4992,7 +5004,7 @@ cc_library(
  464. )
  465. cc_library(
  466. - name = "fp32_mobilenet_v3_large",
  467. + name = "fp32_mobilenet_v3_large.wasm",
  468. srcs = ["models/fp32-mobilenet-v3-large.cc"],
  469. hdrs = ["models/models.h"],
  470. copts = xnnpack_std_cxxopts(),
  471. @@ -5004,7 +5016,7 @@ cc_library(
  472. )
  473. cc_library(
  474. - name = "fp16_mobilenet_v3_large",
  475. + name = "fp16_mobilenet_v3_large.wasm",
  476. srcs = ["models/fp16-mobilenet-v3-large.cc"],
  477. hdrs = ["models/models.h"],
  478. copts = xnnpack_std_cxxopts(),
  479. @@ -5017,7 +5029,7 @@ cc_library(
  480. )
  481. cc_library(
  482. - name = "fp32_mobilenet_v3_small",
  483. + name = "fp32_mobilenet_v3_small.wasm",
  484. srcs = ["models/fp32-mobilenet-v3-small.cc"],
  485. hdrs = ["models/models.h"],
  486. copts = xnnpack_std_cxxopts(),
  487. @@ -5029,7 +5041,7 @@ cc_library(
  488. )
  489. cc_library(
  490. - name = "fp16_mobilenet_v3_small",
  491. + name = "fp16_mobilenet_v3_small.wasm",
  492. srcs = ["models/fp16-mobilenet-v3-small.cc"],
  493. hdrs = ["models/models.h"],
  494. copts = xnnpack_std_cxxopts(),
  495. @@ -5042,51 +5054,51 @@ cc_library(
  496. )
  497. xnnpack_benchmark(
  498. - name = "f32_dwconv_e2e_bench",
  499. + name = "f32_dwconv_e2e_bench.wasm",
  500. srcs = [
  501. "bench/f32-dwconv-e2e.cc",
  502. "bench/end2end.h",
  503. ] + MICROKERNEL_BENCHMARK_HDRS,
  504. deps = MICROKERNEL_BENCHMARK_DEPS + [
  505. ":XNNPACK",
  506. - ":fp32_mobilenet_v1",
  507. - ":fp32_mobilenet_v2",
  508. - ":fp32_mobilenet_v3_large",
  509. - ":fp32_mobilenet_v3_small",
  510. + ":fp32_mobilenet_v1.wasm",
  511. + ":fp32_mobilenet_v2.wasm",
  512. + ":fp32_mobilenet_v3_large.wasm",
  513. + ":fp32_mobilenet_v3_small.wasm",
  514. ],
  515. )
  516. xnnpack_benchmark(
  517. - name = "f32_gemm_e2e_bench",
  518. + name = "f32_gemm_e2e_bench.wasm",
  519. srcs = [
  520. "bench/f32-gemm-e2e.cc",
  521. "bench/end2end.h",
  522. ] + MICROKERNEL_BENCHMARK_HDRS,
  523. deps = MICROKERNEL_BENCHMARK_DEPS + [
  524. ":XNNPACK",
  525. - ":fp32_mobilenet_v1",
  526. - ":fp32_mobilenet_v2",
  527. - ":fp32_mobilenet_v3_large",
  528. - ":fp32_mobilenet_v3_small",
  529. + ":fp32_mobilenet_v1.wasm",
  530. + ":fp32_mobilenet_v2.wasm",
  531. + ":fp32_mobilenet_v3_large.wasm",
  532. + ":fp32_mobilenet_v3_small.wasm",
  533. ],
  534. )
  535. xnnpack_benchmark(
  536. - name = "end2end_bench",
  537. + name = "end2end_bench.wasm",
  538. srcs = ["bench/end2end.cc"],
  539. deps = [
  540. ":XNNPACK",
  541. ":bench_utils",
  542. - ":fp16_mobilenet_v1",
  543. - ":fp16_mobilenet_v2",
  544. - ":fp16_mobilenet_v3_large",
  545. - ":fp16_mobilenet_v3_small",
  546. - ":fp32_mobilenet_v1",
  547. - ":fp32_mobilenet_v2",
  548. - ":fp32_mobilenet_v3_large",
  549. - ":fp32_mobilenet_v3_small",
  550. - ":qs8_mobilenet_v1",
  551. - ":qs8_mobilenet_v2",
  552. + ":fp16_mobilenet_v1.wasm",
  553. + ":fp16_mobilenet_v2.wasm",
  554. + ":fp16_mobilenet_v3_large.wasm",
  555. + ":fp16_mobilenet_v3_small.wasm",
  556. + ":fp32_mobilenet_v1.wasm",
  557. + ":fp32_mobilenet_v2.wasm",
  558. + ":fp32_mobilenet_v3_large.wasm",
  559. + ":fp32_mobilenet_v3_small.wasm",
  560. + ":qs8_mobilenet_v1.wasm",
  561. + ":qs8_mobilenet_v2.wasm",
  562. "@pthreadpool",
  563. ],
  564. )
  565. @@ -5094,7 +5106,7 @@ xnnpack_benchmark(
  566. #################### Accuracy evaluation for math functions ####################
  567. xnnpack_benchmark(
  568. - name = "f32_exp_eval",
  569. + name = "f32_exp_eval.wasm",
  570. srcs = [
  571. "eval/f32-exp.cc",
  572. "src/xnnpack/AlignedAllocator.h",
  573. @@ -5103,7 +5115,7 @@ xnnpack_benchmark(
  574. )
  575. xnnpack_benchmark(
  576. - name = "f32_expminus_eval",
  577. + name = "f32_expminus_eval.wasm",
  578. srcs = [
  579. "eval/f32-expminus.cc",
  580. "src/xnnpack/AlignedAllocator.h",
  581. @@ -5112,7 +5124,7 @@ xnnpack_benchmark(
  582. )
  583. xnnpack_benchmark(
  584. - name = "f32_extexp_eval",
  585. + name = "f32_extexp_eval.wasm",
  586. srcs = [
  587. "eval/f32-extexp.cc",
  588. "src/xnnpack/AlignedAllocator.h",
  589. @@ -5121,7 +5133,7 @@ xnnpack_benchmark(
  590. )
  591. xnnpack_unit_test(
  592. - name = "f32_roundne_eval",
  593. + name = "f32_roundne_eval.wasm",
  594. srcs = [
  595. "eval/f32-roundne.cc",
  596. "src/xnnpack/AlignedAllocator.h",
  597. @@ -5132,7 +5144,7 @@ xnnpack_unit_test(
  598. )
  599. xnnpack_unit_test(
  600. - name = "f32_roundd_eval",
  601. + name = "f32_roundd_eval.wasm",
  602. srcs = [
  603. "eval/f32-roundd.cc",
  604. "src/xnnpack/AlignedAllocator.h",
  605. @@ -5143,7 +5155,7 @@ xnnpack_unit_test(
  606. )
  607. xnnpack_unit_test(
  608. - name = "f32_roundu_eval",
  609. + name = "f32_roundu_eval.wasm",
  610. srcs = [
  611. "eval/f32-roundu.cc",
  612. "src/xnnpack/AlignedAllocator.h",
  613. @@ -5154,7 +5166,7 @@ xnnpack_unit_test(
  614. )
  615. xnnpack_unit_test(
  616. - name = "f32_roundz_eval",
  617. + name = "f32_roundz_eval.wasm",
  618. srcs = [
  619. "eval/f32-roundz.cc",
  620. "src/xnnpack/AlignedAllocator.h",
  621. @@ -5165,7 +5177,7 @@ xnnpack_unit_test(
  622. )
  623. xnnpack_benchmark(
  624. - name = "f32_sigmoid_eval",
  625. + name = "f32_sigmoid_eval.wasm",
  626. srcs = [
  627. "eval/f32-sigmoid.cc",
  628. "src/xnnpack/AlignedAllocator.h",
  629. @@ -5174,7 +5186,7 @@ xnnpack_benchmark(
  630. )
  631. xnnpack_benchmark(
  632. - name = "f32_sqrt_eval",
  633. + name = "f32_sqrt_eval.wasm",
  634. srcs = [
  635. "eval/f32-sqrt.cc",
  636. "src/xnnpack/AlignedAllocator.h",
  637. diff --git a/emscripten.bzl b/emscripten.bzl
  638. index faad087..2b4763f 100644
  639. --- a/emscripten.bzl
  640. +++ b/emscripten.bzl
  641. @@ -4,30 +4,25 @@ def xnnpack_emscripten_minimal_linkopts():
  642. """Minimal Emscripten-specific linkopts for binaries."""
  643. return [
  644. "-s ASSERTIONS=0",
  645. - "-s ERROR_ON_UNDEFINED_SYMBOLS=1",
  646. - "-s EXIT_RUNTIME=1",
  647. + "-s ERROR_ON_UNDEFINED_SYMBOLS=0",
  648. ]
  649. def xnnpack_emscripten_test_linkopts():
  650. """Emscripten-specific linkopts for unit tests."""
  651. return [
  652. "-s ASSERTIONS=2",
  653. - "-s ERROR_ON_UNDEFINED_SYMBOLS=1",
  654. + "-s ERROR_ON_UNDEFINED_SYMBOLS=0",
  655. "-s DEMANGLE_SUPPORT=1",
  656. - "-s EXIT_RUNTIME=1",
  657. "-s ALLOW_MEMORY_GROWTH=1",
  658. - "--pre-js $(location :preamble.js.lds)",
  659. ]
  660. def xnnpack_emscripten_benchmark_linkopts():
  661. """Emscripten-specific linkopts for benchmarks."""
  662. return [
  663. "-s ASSERTIONS=1",
  664. - "-s ERROR_ON_UNDEFINED_SYMBOLS=1",
  665. - "-s EXIT_RUNTIME=1",
  666. + "-s ERROR_ON_UNDEFINED_SYMBOLS=0",
  667. "-s ALLOW_MEMORY_GROWTH=1",
  668. "-s TOTAL_MEMORY=268435456", # 256M
  669. - "--pre-js $(location :preamble.js.lds)",
  670. ]
  671. def xnnpack_emscripten_deps():