xnnpack.patch 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665
  1. diff --git a/.bazelrc b/.bazelrc
  2. index ec740f38..2c193244 100644
  3. --- a/.bazelrc
  4. +++ b/.bazelrc
  5. @@ -49,4 +49,10 @@ build:ios_fat --watchos_cpus=armv7k
  6. build:macos --apple_platform_type=macos
  7. build:macos_arm64 --config=macos
  8. -build:macos_arm64 --cpu=darwin_arm64
  9. \ No newline at end of file
  10. +build:macos_arm64 --cpu=darwin_arm64
  11. +
  12. +build:wasm --copt=-msimd128
  13. +build:wasm --cpu=wasm
  14. +build:wasm --crosstool_top=@emsdk//emscripten_toolchain:everything
  15. +build:wasm --host_crosstool_top=@bazel_tools//tools/cpp:toolchain
  16. +
  17. diff --git a/BUILD.bazel b/BUILD.bazel
  18. index 1f2b15a8..e7abf838 100644
  19. --- a/BUILD.bazel
  20. +++ b/BUILD.bazel
  21. @@ -4996,7 +4996,7 @@ xnnpack_cc_library(
  22. ######################### Benchmarks for micro-kernels #########################
  23. xnnpack_benchmark(
  24. - name = "qs8_gemm_bench",
  25. + name = "qs8_gemm_bench.wasm",
  26. srcs = [
  27. "bench/gemm.h",
  28. "bench/qs8-gemm.cc",
  29. @@ -5007,7 +5007,7 @@ xnnpack_benchmark(
  30. )
  31. xnnpack_benchmark(
  32. - name = "qs8_requantization_bench",
  33. + name = "qs8_requantization_bench.wasm",
  34. srcs = [
  35. "bench/qs8-requantization.cc",
  36. "src/xnnpack/AlignedAllocator.h",
  37. @@ -5017,7 +5017,7 @@ xnnpack_benchmark(
  38. )
  39. xnnpack_benchmark(
  40. - name = "qu8_gemm_bench",
  41. + name = "qu8_gemm_bench.wasm",
  42. srcs = [
  43. "bench/gemm.h",
  44. "bench/qu8-gemm.cc",
  45. @@ -5028,7 +5028,7 @@ xnnpack_benchmark(
  46. )
  47. xnnpack_benchmark(
  48. - name = "qu8_requantization_bench",
  49. + name = "qu8_requantization_bench.wasm",
  50. srcs = [
  51. "bench/qu8-requantization.cc",
  52. "src/xnnpack/AlignedAllocator.h",
  53. @@ -5038,11 +5038,10 @@ xnnpack_benchmark(
  54. )
  55. xnnpack_benchmark(
  56. - name = "f16_igemm_bench",
  57. + name = "f16_igemm_bench.wasm",
  58. srcs = [
  59. "bench/f16-igemm.cc",
  60. "bench/conv.h",
  61. - "bench/google/conv.h",
  62. "src/xnnpack/AlignedAllocator.h",
  63. ] + MICROKERNEL_BENCHMARK_HDRS,
  64. deps = MICROKERNEL_BENCHMARK_DEPS + [
  65. @@ -5052,7 +5051,7 @@ xnnpack_benchmark(
  66. )
  67. xnnpack_benchmark(
  68. - name = "f16_gemm_bench",
  69. + name = "f16_gemm_bench.wasm",
  70. srcs = [
  71. "bench/f16-gemm.cc",
  72. "bench/gemm.h",
  73. @@ -5064,7 +5063,7 @@ xnnpack_benchmark(
  74. )
  75. xnnpack_benchmark(
  76. - name = "f16_spmm_bench",
  77. + name = "f16_spmm_bench.wasm",
  78. srcs = [
  79. "bench/f16-spmm.cc",
  80. "bench/spmm.h",
  81. @@ -5074,7 +5073,7 @@ xnnpack_benchmark(
  82. )
  83. xnnpack_benchmark(
  84. - name = "f32_igemm_bench",
  85. + name = "f32_igemm_bench.wasm",
  86. srcs = [
  87. "bench/f32-igemm.cc",
  88. "bench/conv.h",
  89. @@ -5087,7 +5086,7 @@ xnnpack_benchmark(
  90. )
  91. xnnpack_benchmark(
  92. - name = "f16_relu_bench",
  93. + name = "f16_relu_bench.wasm",
  94. srcs = [
  95. "bench/f16-relu.cc",
  96. "src/xnnpack/AlignedAllocator.h",
  97. @@ -5096,7 +5095,7 @@ xnnpack_benchmark(
  98. )
  99. xnnpack_benchmark(
  100. - name = "f32_conv_hwc_bench",
  101. + name = "f32_conv_hwc_bench.wasm",
  102. srcs = [
  103. "bench/f32-conv-hwc.cc",
  104. "bench/dconv.h",
  105. @@ -5108,7 +5107,7 @@ xnnpack_benchmark(
  106. )
  107. xnnpack_benchmark(
  108. - name = "f32_conv_hwc2chw_bench",
  109. + name = "f32_conv_hwc2chw_bench.wasm",
  110. srcs = [
  111. "bench/f32-conv-hwc2chw.cc",
  112. "bench/dconv.h",
  113. @@ -5120,11 +5119,10 @@ xnnpack_benchmark(
  114. )
  115. xnnpack_benchmark(
  116. - name = "f16_dwconv_bench",
  117. + name = "f16_dwconv_bench.wasm",
  118. srcs = [
  119. "bench/f16-dwconv.cc",
  120. "bench/dwconv.h",
  121. - "bench/google/dwconv.h",
  122. "src/xnnpack/AlignedAllocator.h",
  123. ] + MICROKERNEL_BENCHMARK_HDRS,
  124. deps = MICROKERNEL_BENCHMARK_DEPS + [
  125. @@ -5134,7 +5132,7 @@ xnnpack_benchmark(
  126. )
  127. xnnpack_benchmark(
  128. - name = "f32_dwconv_bench",
  129. + name = "f32_dwconv_bench.wasm",
  130. srcs = [
  131. "bench/f32-dwconv.cc",
  132. "bench/dwconv.h",
  133. @@ -5147,7 +5145,7 @@ xnnpack_benchmark(
  134. )
  135. xnnpack_benchmark(
  136. - name = "f32_dwconv2d_chw_bench",
  137. + name = "f32_dwconv2d_chw_bench.wasm",
  138. srcs = [
  139. "bench/f32-dwconv2d-chw.cc",
  140. "bench/dwconv.h",
  141. @@ -5160,7 +5158,7 @@ xnnpack_benchmark(
  142. )
  143. xnnpack_benchmark(
  144. - name = "f32_gemm_bench",
  145. + name = "f32_gemm_bench.wasm",
  146. srcs = [
  147. "bench/f32-gemm.cc",
  148. "bench/gemm.h",
  149. @@ -5171,7 +5169,7 @@ xnnpack_benchmark(
  150. )
  151. xnnpack_benchmark(
  152. - name = "f32_hswish_bench",
  153. + name = "f32_hswish_bench.wasm",
  154. srcs = [
  155. "bench/f32-hswish.cc",
  156. "src/xnnpack/AlignedAllocator.h",
  157. @@ -5180,7 +5178,7 @@ xnnpack_benchmark(
  158. )
  159. xnnpack_benchmark(
  160. - name = "f32_raddexpminusmax_bench",
  161. + name = "f32_raddexpminusmax_bench.wasm",
  162. srcs = [
  163. "bench/f32-raddexpminusmax.cc",
  164. "src/xnnpack/AlignedAllocator.h",
  165. @@ -5189,7 +5187,7 @@ xnnpack_benchmark(
  166. )
  167. xnnpack_benchmark(
  168. - name = "f32_raddextexp_bench",
  169. + name = "f32_raddextexp_bench.wasm",
  170. srcs = [
  171. "bench/f32-raddextexp.cc",
  172. "src/xnnpack/AlignedAllocator.h",
  173. @@ -5198,7 +5196,7 @@ xnnpack_benchmark(
  174. )
  175. xnnpack_benchmark(
  176. - name = "f32_raddstoreexpminusmax_bench",
  177. + name = "f32_raddstoreexpminusmax_bench.wasm",
  178. srcs = [
  179. "bench/f32-raddstoreexpminusmax.cc",
  180. "src/xnnpack/AlignedAllocator.h",
  181. @@ -5207,7 +5205,7 @@ xnnpack_benchmark(
  182. )
  183. xnnpack_benchmark(
  184. - name = "f32_relu_bench",
  185. + name = "f32_relu_bench.wasm",
  186. srcs = [
  187. "bench/f32-relu.cc",
  188. "src/xnnpack/AlignedAllocator.h",
  189. @@ -5216,7 +5214,7 @@ xnnpack_benchmark(
  190. )
  191. xnnpack_benchmark(
  192. - name = "f32_rmax_bench",
  193. + name = "f32_rmax_bench.wasm",
  194. srcs = [
  195. "bench/f32-rmax.cc",
  196. "src/xnnpack/AlignedAllocator.h",
  197. @@ -5225,7 +5223,7 @@ xnnpack_benchmark(
  198. )
  199. xnnpack_benchmark(
  200. - name = "f32_sigmoid_bench",
  201. + name = "f32_sigmoid_bench.wasm",
  202. srcs = [
  203. "bench/f32-sigmoid.cc",
  204. "src/xnnpack/AlignedAllocator.h",
  205. @@ -5234,7 +5232,7 @@ xnnpack_benchmark(
  206. )
  207. xnnpack_benchmark(
  208. - name = "f32_spmm_bench",
  209. + name = "f32_spmm_bench.wasm",
  210. srcs = [
  211. "bench/f32-spmm.cc",
  212. "bench/spmm.h",
  213. @@ -5244,7 +5242,7 @@ xnnpack_benchmark(
  214. )
  215. xnnpack_benchmark(
  216. - name = "f32_softmax_bench",
  217. + name = "f32_softmax_bench.wasm",
  218. srcs = [
  219. "bench/f32-softmax.cc",
  220. ] + MICROKERNEL_BENCHMARK_HDRS,
  221. @@ -5253,7 +5251,7 @@ xnnpack_benchmark(
  222. )
  223. xnnpack_benchmark(
  224. - name = "f32_velu_bench",
  225. + name = "f32_velu_bench.wasm",
  226. srcs = [
  227. "bench/f32-velu.cc",
  228. "src/xnnpack/AlignedAllocator.h",
  229. @@ -5262,7 +5260,7 @@ xnnpack_benchmark(
  230. )
  231. xnnpack_benchmark(
  232. - name = "f32_vscaleexpminusmax_bench",
  233. + name = "f32_vscaleexpminusmax_bench.wasm",
  234. srcs = [
  235. "bench/f32-vscaleexpminusmax.cc",
  236. "src/xnnpack/AlignedAllocator.h",
  237. @@ -5271,7 +5269,7 @@ xnnpack_benchmark(
  238. )
  239. xnnpack_benchmark(
  240. - name = "f32_vscaleextexp_bench",
  241. + name = "f32_vscaleextexp_bench.wasm",
  242. srcs = [
  243. "bench/f32-vscaleextexp.cc",
  244. "src/xnnpack/AlignedAllocator.h",
  245. @@ -5280,7 +5278,7 @@ xnnpack_benchmark(
  246. )
  247. xnnpack_benchmark(
  248. - name = "f32_vsqrt_bench",
  249. + name = "f32_vsqrt_bench.wasm",
  250. srcs = [
  251. "bench/f32-vsqrt.cc",
  252. "src/xnnpack/AlignedAllocator.h",
  253. @@ -5289,7 +5287,7 @@ xnnpack_benchmark(
  254. )
  255. xnnpack_benchmark(
  256. - name = "f32_im2col_gemm_bench",
  257. + name = "f32_im2col_gemm_bench.wasm",
  258. srcs = [
  259. "bench/f32-im2col-gemm.cc",
  260. "bench/conv.h",
  261. @@ -5302,7 +5300,7 @@ xnnpack_benchmark(
  262. )
  263. xnnpack_benchmark(
  264. - name = "rounding_bench",
  265. + name = "rounding_bench.wasm",
  266. srcs = [
  267. "bench/rounding.cc",
  268. "src/xnnpack/AlignedAllocator.h",
  269. @@ -5314,7 +5312,7 @@ xnnpack_benchmark(
  270. ########################### Benchmarks for operators ###########################
  271. xnnpack_benchmark(
  272. - name = "average_pooling_bench",
  273. + name = "average_pooling_bench.wasm",
  274. srcs = ["bench/average-pooling.cc"],
  275. copts = xnnpack_optional_tflite_copts(),
  276. tags = ["nowin32"],
  277. @@ -5322,7 +5320,7 @@ xnnpack_benchmark(
  278. )
  279. xnnpack_benchmark(
  280. - name = "bankers_rounding_bench",
  281. + name = "bankers_rounding_bench.wasm",
  282. srcs = ["bench/bankers-rounding.cc"],
  283. copts = xnnpack_optional_tflite_copts(),
  284. tags = ["nowin32"],
  285. @@ -5330,7 +5328,7 @@ xnnpack_benchmark(
  286. )
  287. xnnpack_benchmark(
  288. - name = "ceiling_bench",
  289. + name = "ceiling_bench.wasm",
  290. srcs = ["bench/ceiling.cc"],
  291. copts = xnnpack_optional_tflite_copts(),
  292. tags = ["nowin32"],
  293. @@ -5338,13 +5336,13 @@ xnnpack_benchmark(
  294. )
  295. xnnpack_benchmark(
  296. - name = "channel_shuffle_bench",
  297. + name = "channel_shuffle_bench.wasm",
  298. srcs = ["bench/channel-shuffle.cc"],
  299. deps = OPERATOR_BENCHMARK_DEPS,
  300. )
  301. xnnpack_benchmark(
  302. - name = "convolution_bench",
  303. + name = "convolution_bench.wasm",
  304. srcs = ["bench/convolution.cc"],
  305. copts = xnnpack_optional_tflite_copts() + xnnpack_optional_armcl_copts(),
  306. tags = ["nowin32"],
  307. @@ -5352,7 +5350,7 @@ xnnpack_benchmark(
  308. )
  309. xnnpack_benchmark(
  310. - name = "deconvolution_bench",
  311. + name = "deconvolution_bench.wasm",
  312. srcs = ["bench/deconvolution.cc"],
  313. copts = xnnpack_optional_tflite_copts(),
  314. tags = ["nowin32"],
  315. @@ -5360,7 +5358,7 @@ xnnpack_benchmark(
  316. )
  317. xnnpack_benchmark(
  318. - name = "elu_bench",
  319. + name = "elu_bench.wasm",
  320. srcs = ["bench/elu.cc"],
  321. copts = xnnpack_optional_tflite_copts(),
  322. tags = ["nowin32"],
  323. @@ -5368,7 +5366,7 @@ xnnpack_benchmark(
  324. )
  325. xnnpack_benchmark(
  326. - name = "floor_bench",
  327. + name = "floor_bench.wasm",
  328. srcs = ["bench/floor.cc"],
  329. copts = xnnpack_optional_tflite_copts(),
  330. tags = ["nowin32"],
  331. @@ -5376,13 +5374,13 @@ xnnpack_benchmark(
  332. )
  333. xnnpack_benchmark(
  334. - name = "global_average_pooling_bench",
  335. + name = "global_average_pooling_bench.wasm",
  336. srcs = ["bench/global-average-pooling.cc"],
  337. deps = OPERATOR_BENCHMARK_DEPS,
  338. )
  339. xnnpack_benchmark(
  340. - name = "hardswish_bench",
  341. + name = "hardswish_bench.wasm",
  342. srcs = ["bench/hardswish.cc"],
  343. copts = xnnpack_optional_tflite_copts(),
  344. tags = ["nowin32"],
  345. @@ -5390,13 +5388,13 @@ xnnpack_benchmark(
  346. )
  347. xnnpack_benchmark(
  348. - name = "max_pooling_bench",
  349. + name = "max_pooling_bench.wasm",
  350. srcs = ["bench/max-pooling.cc"],
  351. deps = OPERATOR_BENCHMARK_DEPS,
  352. )
  353. xnnpack_benchmark(
  354. - name = "sigmoid_bench",
  355. + name = "sigmoid_bench.wasm",
  356. srcs = ["bench/sigmoid.cc"],
  357. copts = xnnpack_optional_tflite_copts(),
  358. tags = ["nowin32"],
  359. @@ -5404,7 +5402,7 @@ xnnpack_benchmark(
  360. )
  361. xnnpack_benchmark(
  362. - name = "prelu_bench",
  363. + name = "prelu_bench.wasm",
  364. srcs = ["bench/prelu.cc"],
  365. copts = xnnpack_optional_tflite_copts(),
  366. tags = ["nowin32"],
  367. @@ -5412,7 +5410,7 @@ xnnpack_benchmark(
  368. )
  369. xnnpack_benchmark(
  370. - name = "softmax_bench",
  371. + name = "softmax_bench.wasm",
  372. srcs = ["bench/softmax.cc"],
  373. copts = xnnpack_optional_tflite_copts(),
  374. tags = ["nowin32"],
  375. @@ -5420,7 +5418,7 @@ xnnpack_benchmark(
  376. )
  377. xnnpack_benchmark(
  378. - name = "square_root_bench",
  379. + name = "square_root_bench.wasm",
  380. srcs = ["bench/square-root.cc"],
  381. copts = xnnpack_optional_tflite_copts(),
  382. tags = ["nowin32"],
  383. @@ -5428,7 +5426,7 @@ xnnpack_benchmark(
  384. )
  385. xnnpack_benchmark(
  386. - name = "truncation_bench",
  387. + name = "truncation_bench.wasm",
  388. srcs = ["bench/truncation.cc"],
  389. deps = OPERATOR_BENCHMARK_DEPS,
  390. )
  391. @@ -5620,7 +5618,7 @@ cc_library(
  392. )
  393. xnnpack_benchmark(
  394. - name = "f32_dwconv_e2e_bench",
  395. + name = "f32_dwconv_e2e_bench.wasm",
  396. srcs = [
  397. "bench/f32-dwconv-e2e.cc",
  398. "bench/end2end.h",
  399. @@ -5635,7 +5633,7 @@ xnnpack_benchmark(
  400. )
  401. xnnpack_benchmark(
  402. - name = "f32_gemm_e2e_bench",
  403. + name = "f32_gemm_e2e_bench.wasm",
  404. srcs = [
  405. "bench/f32-gemm-e2e.cc",
  406. "bench/end2end.h",
  407. @@ -5650,7 +5648,7 @@ xnnpack_benchmark(
  408. )
  409. xnnpack_benchmark(
  410. - name = "qs8_gemm_e2e_bench",
  411. + name = "qs8_gemm_e2e_bench.wasm",
  412. srcs = [
  413. "bench/qs8-gemm-e2e.cc",
  414. "bench/end2end.h",
  415. @@ -5663,7 +5661,7 @@ xnnpack_benchmark(
  416. )
  417. xnnpack_benchmark(
  418. - name = "end2end_bench",
  419. + name = "end2end_bench.wasm",
  420. srcs = ["bench/end2end.cc"],
  421. deps = [
  422. ":XNNPACK",
  423. @@ -5690,7 +5688,7 @@ xnnpack_benchmark(
  424. #################### Accuracy evaluation for math functions ####################
  425. xnnpack_benchmark(
  426. - name = "f32_exp_ulp_eval",
  427. + name = "f32_exp_ulp_eval.wasm",
  428. srcs = [
  429. "eval/f32-exp-ulp.cc",
  430. "src/xnnpack/AlignedAllocator.h",
  431. @@ -5702,7 +5700,7 @@ xnnpack_benchmark(
  432. )
  433. xnnpack_benchmark(
  434. - name = "f32_expminus_ulp_eval",
  435. + name = "f32_expminus_ulp_eval.wasm",
  436. srcs = [
  437. "eval/f32-expminus-ulp.cc",
  438. "src/xnnpack/AlignedAllocator.h",
  439. @@ -5714,7 +5712,7 @@ xnnpack_benchmark(
  440. )
  441. xnnpack_benchmark(
  442. - name = "f32_expm1minus_ulp_eval",
  443. + name = "f32_expm1minus_ulp_eval.wasm",
  444. srcs = [
  445. "eval/f32-expm1minus-ulp.cc",
  446. "src/xnnpack/AlignedAllocator.h",
  447. @@ -5726,7 +5724,7 @@ xnnpack_benchmark(
  448. )
  449. xnnpack_benchmark(
  450. - name = "f32_extexp_ulp_eval",
  451. + name = "f32_extexp_ulp_eval.wasm",
  452. srcs = [
  453. "eval/f32-extexp-ulp.cc",
  454. "src/xnnpack/AlignedAllocator.h",
  455. @@ -5738,7 +5736,7 @@ xnnpack_benchmark(
  456. )
  457. xnnpack_benchmark(
  458. - name = "f32_sigmoid_ulp_eval",
  459. + name = "f32_sigmoid_ulp_eval.wasm",
  460. srcs = [
  461. "eval/f32-sigmoid-ulp.cc",
  462. "src/xnnpack/AlignedAllocator.h",
  463. @@ -5750,7 +5748,7 @@ xnnpack_benchmark(
  464. )
  465. xnnpack_benchmark(
  466. - name = "f32_sqrt_ulp_eval",
  467. + name = "f32_sqrt_ulp_eval.wasm",
  468. srcs = [
  469. "eval/f32-sqrt-ulp.cc",
  470. "src/xnnpack/AlignedAllocator.h",
  471. diff --git a/WORKSPACE b/WORKSPACE
  472. index 4fa1aa2f..6181aab2 100644
  473. --- a/WORKSPACE
  474. +++ b/WORKSPACE
  475. @@ -5,8 +5,8 @@ load("@bazel_tools//tools/build_defs/repo:http.bzl", "http_archive")
  476. # Bazel rule definitions
  477. http_archive(
  478. name = "rules_cc",
  479. - strip_prefix = "rules_cc-master",
  480. - urls = ["https://github.com/bazelbuild/rules_cc/archive/master.zip"],
  481. + strip_prefix = "rules_cc-main",
  482. + urls = ["https://github.com/bazelbuild/rules_cc/archive/main.zip"],
  483. )
  484. # Google Test framework, used by most unit-tests.
  485. @@ -19,8 +19,8 @@ http_archive(
  486. # Google Benchmark library, used in micro-benchmarks.
  487. http_archive(
  488. name = "com_google_benchmark",
  489. - strip_prefix = "benchmark-master",
  490. - urls = ["https://github.com/google/benchmark/archive/master.zip"],
  491. + strip_prefix = "benchmark-1.5.3",
  492. + urls = ["https://github.com/google/benchmark/archive/refs/tags/v1.5.3.zip"],
  493. )
  494. # FP16 library, used for half-precision conversions
  495. @@ -89,3 +89,18 @@ android_ndk_repository(name = "androidndk")
  496. # Android SDK location and API is auto-detected from $ANDROID_HOME environment variable
  497. android_sdk_repository(name = "androidsdk")
  498. +
  499. +# emscripten library
  500. +http_archive(
  501. + name = "emsdk",
  502. + strip_prefix = "emsdk-c1589b55641787d55d53e883852035beea9aec3f/bazel",
  503. + url = "https://github.com/emscripten-core/emsdk/archive/c1589b55641787d55d53e883852035beea9aec3f.tar.gz",
  504. + sha256 = "7a58a9996b113d3e0675df30b5f17e28aa47de2e684a844f05394fe2f6f12e8e",
  505. +)
  506. +
  507. +load("@emsdk//:deps.bzl", emsdk_deps = "deps")
  508. +emsdk_deps()
  509. +
  510. +load("@emsdk//:emscripten_deps.bzl", emsdk_emscripten_deps = "emscripten_deps")
  511. +emsdk_emscripten_deps()
  512. +
  513. diff --git a/build_defs.bzl b/build_defs.bzl
  514. index 10345032..0e926fca 100644
  515. --- a/build_defs.bzl
  516. +++ b/build_defs.bzl
  517. @@ -1,6 +1,6 @@
  518. """Build definitions and rules for XNNPACK."""
  519. -load(":emscripten.bzl", "xnnpack_emscripten_benchmark_linkopts", "xnnpack_emscripten_deps", "xnnpack_emscripten_minimal_linkopts", "xnnpack_emscripten_test_linkopts")
  520. +load(":emscripten.bzl", "xnnpack_emscripten_benchmark_linkopts", "xnnpack_emscripten_deps", "xnnpack_emscripten_minimal_linkopts", "xnnpack_emscripten_test_linkopts", "xnnpack_emscripten_benchmark_copts")
  521. def xnnpack_visibility():
  522. """Visibility of :XNNPACK target.
  523. @@ -424,10 +424,15 @@ def xnnpack_benchmark(name, srcs, copts = [], deps = [], tags = []):
  524. ":windows_x86_64_mingw": ["-Wno-unused-function"],
  525. ":windows_x86_64_msys": ["-Wno-unused-function"],
  526. ":windows_x86_64": [],
  527. + ":emscripten": xnnpack_emscripten_benchmark_copts(),
  528. + ":emscripten_wasm": xnnpack_emscripten_benchmark_copts(),
  529. + ":emscripten_wasmsimd": xnnpack_emscripten_benchmark_copts(),
  530. "//conditions:default": ["-Wno-unused-function"],
  531. }) + copts,
  532. linkopts = select({
  533. ":emscripten": xnnpack_emscripten_benchmark_linkopts(),
  534. + ":emscripten_wasm": xnnpack_emscripten_benchmark_linkopts(),
  535. + ":emscripten_wasmsimd": xnnpack_emscripten_benchmark_linkopts(),
  536. ":windows_x86_64_mingw": ["-lshlwapi"],
  537. ":windows_x86_64_msys": ["-lshlwapi"],
  538. "//conditions:default": [],
  539. diff --git a/emscripten.bzl b/emscripten.bzl
  540. index 0a0caedf..aafe3199 100644
  541. --- a/emscripten.bzl
  542. +++ b/emscripten.bzl
  543. @@ -6,6 +6,7 @@ def xnnpack_emscripten_minimal_linkopts():
  544. "-s ASSERTIONS=0",
  545. "-s ERROR_ON_UNDEFINED_SYMBOLS=1",
  546. "-s EXIT_RUNTIME=1",
  547. + "--oformat=wasm",
  548. ]
  549. def xnnpack_emscripten_test_linkopts():
  550. @@ -17,21 +18,36 @@ def xnnpack_emscripten_test_linkopts():
  551. "-s EXIT_RUNTIME=1",
  552. "-s ALLOW_MEMORY_GROWTH=1",
  553. "--pre-js $(location :preamble.js.lds)",
  554. + "--oformat=wasm",
  555. ]
  556. def xnnpack_emscripten_benchmark_linkopts():
  557. """Emscripten-specific linkopts for benchmarks."""
  558. return [
  559. "-s ASSERTIONS=1",
  560. - "-s ERROR_ON_UNDEFINED_SYMBOLS=1",
  561. - "-s EXIT_RUNTIME=1",
  562. - "-s ALLOW_MEMORY_GROWTH=1",
  563. + "-s ERROR_ON_UNDEFINED_SYMBOLS=0",
  564. + "-s ALLOW_MEMORY_GROWTH=0",
  565. "-s TOTAL_MEMORY=436207616", # 416M
  566. - "--pre-js $(location :preamble.js.lds)",
  567. + "-s USE_PTHREADS=0",
  568. + "-s STANDALONE_WASM=1",
  569. + "-Wno-unused",
  570. + "-Wl,--export=__heap_base",
  571. + "-Wl,--export=__data_end",
  572. + "-Wl,--export=malloc",
  573. + "-Wl,--export=free",
  574. + "--oformat=wasm",
  575. ]
  576. def xnnpack_emscripten_deps():
  577. """Emscripten-specific dependencies for unit tests and benchmarks."""
  578. + return []
  579. +
  580. +def xnnpack_emscripten_benchmark_copts():
  581. return [
  582. - ":preamble.js.lds",
  583. + "-s ASSERTIONS=1",
  584. + "-s ERROR_ON_UNDEFINED_SYMBOLS=0",
  585. + "-s ALLOW_MEMORY_GROWTH=0",
  586. + "-s USE_PTHREADS=0",
  587. + "-s STANDALONE_WASM=1",
  588. + "-Wno-unused",
  589. ]
  590. diff --git a/third_party/cpuinfo.BUILD b/third_party/cpuinfo.BUILD
  591. index 128d683e..f6c287c4 100644
  592. --- a/third_party/cpuinfo.BUILD
  593. +++ b/third_party/cpuinfo.BUILD
  594. @@ -343,5 +343,5 @@ config_setting(
  595. config_setting(
  596. name = "emscripten",
  597. - values = {"crosstool_top": "//toolchain:emscripten"},
  598. + values = {"crosstool_top": "@emsdk//emscripten_toolchain:everything"},
  599. )