| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285 |
- /* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
- Licensed under the Apache License, Version 2.0 (the "License");
- you may not use this file except in compliance with the License.
- You may obtain a copy of the License at
- http://www.apache.org/licenses/LICENSE-2.0
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
- ==============================================================================*/
- #include "tensorflow/lite/c/builtin_op_data.h"
- #include "tensorflow/lite/c/common.h"
- #include "tensorflow/lite/kernels/internal/common.h"
- #include "tensorflow/lite/kernels/internal/quantization_util.h"
- #include "tensorflow/lite/kernels/internal/tensor_ctypes.h"
- #include "tensorflow/lite/kernels/internal/types.h"
- #include "tensorflow/lite/kernels/kernel_util.h"
- #include "tensorflow/lite/kernels/op_macros.h"
- #include "tensorflow/lite/micro/kernels/kernel_util.h"
- #include "tensorflow/lite/micro/micro_utils.h"
- namespace tflite {
- namespace ops {
- namespace micro {
- namespace activations {
- namespace {
- struct ReluOpData {
- ReluParams params;
- };
- struct Relu6OpData {
- int8_t six_int8;
- int8_t zero_int8;
- uint8_t six_uint8;
- uint8_t zero_uint8;
- };
- } // namespace
- constexpr int kInputTensor = 0;
- constexpr int kOutputTensor = 0;
- template <typename T>
- inline void ReluQuantized(const ReluOpData& data,
- const RuntimeShape& input_shape,
- const RuntimeShape& output_shape, const T* input_data,
- T* output_data) {
- const int flat_size = MatchingFlatSize(input_shape, output_shape);
- for (int i = 0; i < flat_size; ++i) {
- const int32_t val = static_cast<int32_t>(input_data[i]);
- int32_t clamped =
- data.params.output_offset +
- MultiplyByQuantizedMultiplier(val - data.params.input_offset,
- data.params.output_multiplier,
- data.params.output_shift);
- clamped = std::max(data.params.quantized_activation_min, clamped);
- clamped = std::min(data.params.quantized_activation_max, clamped);
- output_data[i] = static_cast<T>(clamped);
- }
- }
- template <typename T>
- inline void CalculateReluOpData(const TfLiteTensor* input, TfLiteTensor* output,
- ReluOpData* data) {
- float act_min = 0.0;
- float act_max = std::numeric_limits<float>::infinity();
- double real_multiplier =
- static_cast<double>(input->params.scale / output->params.scale);
- const RuntimeShape input_shape = GetTensorShape(input);
- const RuntimeShape output_shape = GetTensorShape(output);
- QuantizeMultiplier(real_multiplier, &data->params.output_multiplier,
- &data->params.output_shift);
- data->params.quantized_activation_min = std::max(
- static_cast<int32_t>(std::numeric_limits<T>::min()),
- output->params.zero_point +
- static_cast<int32_t>(roundf(act_min / output->params.scale)));
- data->params.quantized_activation_max =
- act_max == std::numeric_limits<float>::infinity()
- ? static_cast<int32_t>(std::numeric_limits<T>::max())
- : std::min(static_cast<int32_t>(std::numeric_limits<T>::max()),
- output->params.zero_point +
- static_cast<int32_t>(
- roundf(act_max / output->params.scale)));
- data->params.input_offset = input->params.zero_point;
- data->params.output_offset = output->params.zero_point;
- }
- inline void ReluFloat(const RuntimeShape& input_shape, const float* input_data,
- const RuntimeShape& output_shape, float* output_data) {
- const int flat_size = MatchingFlatSize(input_shape, output_shape);
- for (int i = 0; i < flat_size; ++i) {
- const float val = input_data[i];
- const float lower = 0.0f;
- const float clamped = val < lower ? lower : val;
- output_data[i] = clamped;
- }
- }
- inline void Relu6Float(const RuntimeShape& input_shape, const float* input_data,
- const RuntimeShape& output_shape, float* output_data) {
- const int flat_size = MatchingFlatSize(input_shape, output_shape);
- for (int i = 0; i < flat_size; ++i) {
- const float val = input_data[i];
- const float upper = 6.0f;
- const float lower = 0.0f;
- const float clamped = val > upper ? upper : val < lower ? lower : val;
- output_data[i] = clamped;
- }
- }
- template <typename Q>
- inline void Relu6Quantized(Q lower, Q upper, const RuntimeShape& input_shape,
- const Q* input_data,
- const RuntimeShape& output_shape, Q* output_data) {
- const int flat_size = MatchingFlatSize(input_shape, output_shape);
- for (int i = 0; i < flat_size; ++i) {
- const Q val = input_data[i];
- const Q clamped = val > upper ? upper : val < lower ? lower : val;
- output_data[i] = clamped;
- }
- }
- void* ReluInit(TfLiteContext* context, const char* buffer, size_t length) {
- TFLITE_DCHECK(context->AllocatePersistentBuffer != nullptr);
- return context->AllocatePersistentBuffer(context, sizeof(ReluOpData));
- }
- TfLiteStatus ReluPrepare(TfLiteContext* context, TfLiteNode* node) {
- TFLITE_DCHECK(node->user_data != nullptr);
- ReluOpData* data = static_cast<ReluOpData*>(node->user_data);
- const TfLiteTensor* input = GetInput(context, node, kInputTensor);
- TfLiteTensor* output = GetOutput(context, node, kOutputTensor);
- if (input->type == kTfLiteInt8) {
- CalculateReluOpData<int8_t>(input, output, data);
- } else if (input->type == kTfLiteUInt8) {
- CalculateReluOpData<uint8_t>(input, output, data);
- }
- return kTfLiteOk;
- }
- TfLiteStatus ReluEval(TfLiteContext* context, TfLiteNode* node) {
- TFLITE_DCHECK(node->user_data != nullptr);
- const ReluOpData& data = *(static_cast<const ReluOpData*>(node->user_data));
- const TfLiteEvalTensor* input =
- tflite::micro::GetEvalInput(context, node, kInputTensor);
- TfLiteEvalTensor* output =
- tflite::micro::GetEvalOutput(context, node, kOutputTensor);
- switch (input->type) {
- case kTfLiteFloat32: {
- ReluFloat(tflite::micro::GetTensorShape(input),
- tflite::micro::GetTensorData<float>(input),
- tflite::micro::GetTensorShape(output),
- tflite::micro::GetTensorData<float>(output));
- return kTfLiteOk;
- }
- case kTfLiteInt8: {
- ReluQuantized<int8_t>(data, tflite::micro::GetTensorShape(input),
- tflite::micro::GetTensorShape(output),
- tflite::micro::GetTensorData<int8_t>(input),
- tflite::micro::GetTensorData<int8_t>(output));
- return kTfLiteOk;
- }
- case kTfLiteUInt8: {
- ReluQuantized<uint8_t>(data, tflite::micro::GetTensorShape(input),
- tflite::micro::GetTensorShape(output),
- tflite::micro::GetTensorData<uint8_t>(input),
- tflite::micro::GetTensorData<uint8_t>(output));
- return kTfLiteOk;
- }
- default: {
- TF_LITE_KERNEL_LOG(context, "Only float32 is supported currently, got %s",
- TfLiteTypeGetName(input->type));
- return kTfLiteError;
- }
- }
- }
- void* Relu6Init(TfLiteContext* context, const char* buffer, size_t length) {
- TFLITE_DCHECK(context->AllocatePersistentBuffer != nullptr);
- return context->AllocatePersistentBuffer(context, sizeof(Relu6OpData));
- }
- TfLiteStatus Relu6Prepare(TfLiteContext* context, TfLiteNode* node) {
- TFLITE_DCHECK(node->user_data != nullptr);
- Relu6OpData* data = static_cast<Relu6OpData*>(node->user_data);
- const TfLiteTensor* input = GetInput(context, node, kInputTensor);
- if (input->type == kTfLiteInt8) {
- data->six_int8 = FloatToAsymmetricQuantizedInt8(6.0f, input->params.scale,
- input->params.zero_point);
- data->zero_int8 = input->params.zero_point;
- } else if (input->type == kTfLiteUInt8) {
- data->six_uint8 = FloatToAsymmetricQuantizedUInt8(6.0f, input->params.scale,
- input->params.zero_point);
- data->zero_uint8 = input->params.zero_point;
- }
- return kTfLiteOk;
- }
- TfLiteStatus Relu6Eval(TfLiteContext* context, TfLiteNode* node) {
- TFLITE_DCHECK(node->user_data != nullptr);
- const Relu6OpData& data = *(static_cast<const Relu6OpData*>(node->user_data));
- const TfLiteEvalTensor* input =
- tflite::micro::GetEvalInput(context, node, kInputTensor);
- TfLiteEvalTensor* output =
- tflite::micro::GetEvalOutput(context, node, kOutputTensor);
- switch (input->type) {
- case kTfLiteFloat32: {
- Relu6Float(tflite::micro::GetTensorShape(input),
- tflite::micro::GetTensorData<float>(input),
- tflite::micro::GetTensorShape(output),
- tflite::micro::GetTensorData<float>(output));
- return kTfLiteOk;
- }
- case kTfLiteInt8: {
- Relu6Quantized<int8_t>(data.zero_int8, data.six_int8,
- tflite::micro::GetTensorShape(input),
- tflite::micro::GetTensorData<int8_t>(input),
- tflite::micro::GetTensorShape(output),
- tflite::micro::GetTensorData<int8_t>(output));
- return kTfLiteOk;
- }
- case kTfLiteUInt8: {
- Relu6Quantized<uint8_t>(data.zero_uint8, data.six_uint8,
- tflite::micro::GetTensorShape(input),
- tflite::micro::GetTensorData<uint8_t>(input),
- tflite::micro::GetTensorShape(output),
- tflite::micro::GetTensorData<uint8_t>(output));
- return kTfLiteOk;
- }
- default: {
- TF_LITE_KERNEL_LOG(context, "Only float32 is supported currently, got %s",
- TfLiteTypeGetName(input->type));
- return kTfLiteError;
- }
- }
- }
- } // namespace activations
- TfLiteRegistration Register_RELU() {
- return {/*init=*/activations::ReluInit,
- /*free=*/nullptr,
- /*prepare=*/activations::ReluPrepare,
- /*invoke=*/activations::ReluEval,
- /*profiling_string=*/nullptr,
- /*builtin_code=*/0,
- /*custom_name=*/nullptr,
- /*version=*/0};
- }
- TfLiteRegistration Register_RELU6() {
- return {/*init=*/activations::Relu6Init,
- /*free=*/nullptr,
- /*prepare=*/activations::Relu6Prepare,
- /*invoke=*/activations::Relu6Eval,
- /*profiling_string=*/nullptr,
- /*builtin_code=*/0,
- /*custom_name=*/nullptr,
- /*version=*/0};
- }
- } // namespace micro
- } // namespace ops
- } // namespace tflite
|