arm_convolve_wrapper_s8.c 5.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131
  1. /*
  2. * Copyright (C) 2020 Arm Limited or its affiliates. All rights reserved.
  3. *
  4. * SPDX-License-Identifier: Apache-2.0
  5. *
  6. * Licensed under the Apache License, Version 2.0 (the License); you may
  7. * not use this file except in compliance with the License.
  8. * You may obtain a copy of the License at
  9. *
  10. * www.apache.org/licenses/LICENSE-2.0
  11. *
  12. * Unless required by applicable law or agreed to in writing, software
  13. * distributed under the License is distributed on an AS IS BASIS, WITHOUT
  14. * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  15. * See the License for the specific language governing permissions and
  16. * limitations under the License.
  17. */
  18. /* ----------------------------------------------------------------------
  19. * Project: CMSIS NN Library
  20. * Title: arm_convolve_wrapper_s8.c
  21. * Description: s8 convolution layer wrapper function with the main purpose to call the optimal kernel available in
  22. * cmsis-nn to perform the convolution.
  23. *
  24. * $Date: 09. October 2020
  25. * $Revision: V.1.0.1
  26. *
  27. * Target Processor: Cortex-M cores
  28. *
  29. * -------------------------------------------------------------------- */
  30. #include "arm_nnfunctions.h"
  31. /**
  32. * @ingroup groupNN
  33. */
  34. /**
  35. * @addtogroup NNConv
  36. * @{
  37. */
  38. /*
  39. * Convolution layer
  40. *
  41. * Refer to the header file for details.
  42. *
  43. */
  44. arm_status arm_convolve_wrapper_s8(const cmsis_nn_context *ctx,
  45. const cmsis_nn_conv_params *conv_params,
  46. const cmsis_nn_per_channel_quant_params *quant_params,
  47. const cmsis_nn_dims *input_dims,
  48. const q7_t *input_data,
  49. const cmsis_nn_dims *filter_dims,
  50. const q7_t *filter_data,
  51. const cmsis_nn_dims *bias_dims,
  52. const int32_t *bias_data,
  53. const cmsis_nn_dims *output_dims,
  54. q7_t *output_data)
  55. {
  56. if ((conv_params->padding.w == 0) && (conv_params->padding.h == 0) && (input_dims->c % 4 == 0) &&
  57. (conv_params->stride.w == 1) && (conv_params->stride.h == 1) && (filter_dims->w == 1) && (filter_dims->h == 1))
  58. {
  59. return arm_convolve_1x1_s8_fast(ctx,
  60. conv_params,
  61. quant_params,
  62. input_dims,
  63. input_data,
  64. filter_dims,
  65. filter_data,
  66. bias_dims,
  67. bias_data,
  68. output_dims,
  69. output_data);
  70. }
  71. else if ((output_dims->h == 1) && (input_dims->h == 1) && (filter_dims->h == 1) && (output_dims->w % 4 == 0) &&
  72. (input_dims->n == 1))
  73. {
  74. return arm_convolve_1_x_n_s8(ctx,
  75. conv_params,
  76. quant_params,
  77. input_dims,
  78. input_data,
  79. filter_dims,
  80. filter_data,
  81. bias_dims,
  82. bias_data,
  83. output_dims,
  84. output_data);
  85. }
  86. else
  87. {
  88. return arm_convolve_s8(ctx,
  89. conv_params,
  90. quant_params,
  91. input_dims,
  92. input_data,
  93. filter_dims,
  94. filter_data,
  95. bias_dims,
  96. bias_data,
  97. output_dims,
  98. output_data);
  99. }
  100. }
  101. int32_t arm_convolve_wrapper_s8_get_buffer_size(const cmsis_nn_conv_params *conv_params,
  102. const cmsis_nn_dims *input_dims,
  103. const cmsis_nn_dims *filter_dims,
  104. const cmsis_nn_dims *output_dims)
  105. {
  106. if ((conv_params->padding.w == 0) && (conv_params->padding.h == 0) && (input_dims->c % 4 == 0) &&
  107. (conv_params->stride.w == 1) && (conv_params->stride.h == 1) && (filter_dims->w == 1) && (filter_dims->h == 1))
  108. {
  109. return arm_convolve_1x1_s8_fast_get_buffer_size(input_dims);
  110. }
  111. else if ((output_dims->h == 1) && (input_dims->h == 1) && (filter_dims->h == 1) && (output_dims->w % 4 == 0) &&
  112. (input_dims->n == 1))
  113. {
  114. return arm_convolve_1_x_n_s8_get_buffer_size(input_dims, filter_dims);
  115. }
  116. else
  117. {
  118. return arm_convolve_s8_get_buffer_size(input_dims, filter_dims);
  119. }
  120. }
  121. /**
  122. * @} end of NNConv group
  123. */