xref: /aosp_15_r20/external/armnn/delegate/classic/src/Quantization.hpp (revision 89c4ff92f2867872bb9e2354d150bf0c8c502810)
1*89c4ff92SAndroid Build Coastguard Worker //
2*89c4ff92SAndroid Build Coastguard Worker // Copyright © 2022-2023 Arm Ltd and Contributors. All rights reserved.
3*89c4ff92SAndroid Build Coastguard Worker // SPDX-License-Identifier: MIT
4*89c4ff92SAndroid Build Coastguard Worker //
5*89c4ff92SAndroid Build Coastguard Worker 
6*89c4ff92SAndroid Build Coastguard Worker #pragma once
7*89c4ff92SAndroid Build Coastguard Worker 
8*89c4ff92SAndroid Build Coastguard Worker #include <armnn/utility/IgnoreUnused.hpp>
9*89c4ff92SAndroid Build Coastguard Worker 
10*89c4ff92SAndroid Build Coastguard Worker #include <tensorflow/lite/builtin_ops.h>
11*89c4ff92SAndroid Build Coastguard Worker #include <tensorflow/lite/c/builtin_op_data.h>
12*89c4ff92SAndroid Build Coastguard Worker #include <tensorflow/lite/c/common.h>
13*89c4ff92SAndroid Build Coastguard Worker #include <tensorflow/lite/minimal_logging.h>
14*89c4ff92SAndroid Build Coastguard Worker 
15*89c4ff92SAndroid Build Coastguard Worker namespace armnnDelegate
16*89c4ff92SAndroid Build Coastguard Worker {
17*89c4ff92SAndroid Build Coastguard Worker 
VisitDequantizeOperator(DelegateData & delegateData,TfLiteContext * tfLiteContext,TfLiteNode * tfLiteNode,int nodeIndex,int32_t tfLiteDequantizeOperatorCode)18*89c4ff92SAndroid Build Coastguard Worker TfLiteStatus VisitDequantizeOperator(DelegateData& delegateData,
19*89c4ff92SAndroid Build Coastguard Worker                                      TfLiteContext* tfLiteContext,
20*89c4ff92SAndroid Build Coastguard Worker                                      TfLiteNode* tfLiteNode,
21*89c4ff92SAndroid Build Coastguard Worker                                      int nodeIndex,
22*89c4ff92SAndroid Build Coastguard Worker                                      int32_t tfLiteDequantizeOperatorCode)
23*89c4ff92SAndroid Build Coastguard Worker {
24*89c4ff92SAndroid Build Coastguard Worker     TF_LITE_ENSURE_STATUS(ValidateNumInputs(tfLiteContext, tfLiteNode, 1, nodeIndex));
25*89c4ff92SAndroid Build Coastguard Worker     TF_LITE_ENSURE_STATUS(ValidateNumOutputs(tfLiteContext, tfLiteNode, 1, nodeIndex));
26*89c4ff92SAndroid Build Coastguard Worker 
27*89c4ff92SAndroid Build Coastguard Worker     const TfLiteTensor* tfLiteTensors = tfLiteContext->tensors;
28*89c4ff92SAndroid Build Coastguard Worker     const TfLiteTensor& tfLiteInputTensor = tfLiteTensors[tfLiteNode->inputs->data[0]];
29*89c4ff92SAndroid Build Coastguard Worker     if (IsDynamicTensor(tfLiteInputTensor))
30*89c4ff92SAndroid Build Coastguard Worker     {
31*89c4ff92SAndroid Build Coastguard Worker         TF_LITE_MAYBE_KERNEL_LOG(
32*89c4ff92SAndroid Build Coastguard Worker             tfLiteContext,
33*89c4ff92SAndroid Build Coastguard Worker             "TfLiteArmnnDelegate: Dynamic input tensors are not supported in operator #%d node #%d: ",
34*89c4ff92SAndroid Build Coastguard Worker             tfLiteDequantizeOperatorCode, nodeIndex);
35*89c4ff92SAndroid Build Coastguard Worker         return kTfLiteError;
36*89c4ff92SAndroid Build Coastguard Worker     }
37*89c4ff92SAndroid Build Coastguard Worker 
38*89c4ff92SAndroid Build Coastguard Worker     const TfLiteTensor& tfLiteOutputTensor = tfLiteTensors[tfLiteNode->outputs->data[0]];
39*89c4ff92SAndroid Build Coastguard Worker     if (IsDynamicTensor(tfLiteOutputTensor))
40*89c4ff92SAndroid Build Coastguard Worker     {
41*89c4ff92SAndroid Build Coastguard Worker         TF_LITE_MAYBE_KERNEL_LOG(
42*89c4ff92SAndroid Build Coastguard Worker             tfLiteContext,
43*89c4ff92SAndroid Build Coastguard Worker             "TfLiteArmnnDelegate: Dynamic output tensors are not supported in operator #%d node #%d: ",
44*89c4ff92SAndroid Build Coastguard Worker             tfLiteDequantizeOperatorCode, nodeIndex);
45*89c4ff92SAndroid Build Coastguard Worker 
46*89c4ff92SAndroid Build Coastguard Worker         return kTfLiteError;
47*89c4ff92SAndroid Build Coastguard Worker     }
48*89c4ff92SAndroid Build Coastguard Worker     const armnn::TensorInfo& inputTensorInfo = GetTensorInfoForTfLiteTensor(tfLiteInputTensor);
49*89c4ff92SAndroid Build Coastguard Worker     armnn::TensorInfo outputTensorInfo = GetTensorInfoForTfLiteTensor(tfLiteOutputTensor, true);
50*89c4ff92SAndroid Build Coastguard Worker 
51*89c4ff92SAndroid Build Coastguard Worker     UpdateConstantTensorOutputs(inputTensorInfo, outputTensorInfo);
52*89c4ff92SAndroid Build Coastguard Worker 
53*89c4ff92SAndroid Build Coastguard Worker     bool isSupported = false;
54*89c4ff92SAndroid Build Coastguard Worker     armnn::BackendId setBackend;
55*89c4ff92SAndroid Build Coastguard Worker     auto validateFunc = [&](const armnn::TensorInfo& outputTensorInfo, bool& isSupported)
56*89c4ff92SAndroid Build Coastguard Worker     {
57*89c4ff92SAndroid Build Coastguard Worker         FORWARD_LAYER_SUPPORT_FUNC("DEQUANTIZE",
58*89c4ff92SAndroid Build Coastguard Worker                                    tfLiteContext,
59*89c4ff92SAndroid Build Coastguard Worker                                    IsDequantizeSupported,
60*89c4ff92SAndroid Build Coastguard Worker                                    delegateData.m_Backends,
61*89c4ff92SAndroid Build Coastguard Worker                                    isSupported,
62*89c4ff92SAndroid Build Coastguard Worker                                    setBackend,
63*89c4ff92SAndroid Build Coastguard Worker                                    inputTensorInfo,
64*89c4ff92SAndroid Build Coastguard Worker                                    outputTensorInfo);
65*89c4ff92SAndroid Build Coastguard Worker     };
66*89c4ff92SAndroid Build Coastguard Worker 
67*89c4ff92SAndroid Build Coastguard Worker     if (!delegateData.m_Network)
68*89c4ff92SAndroid Build Coastguard Worker     {
69*89c4ff92SAndroid Build Coastguard Worker         validateFunc(outputTensorInfo, isSupported);
70*89c4ff92SAndroid Build Coastguard Worker         return isSupported ? kTfLiteOk : kTfLiteError;
71*89c4ff92SAndroid Build Coastguard Worker     }
72*89c4ff92SAndroid Build Coastguard Worker 
73*89c4ff92SAndroid Build Coastguard Worker     armnn::IConnectableLayer* dequantizeLayer = delegateData.m_Network->AddDequantizeLayer();
74*89c4ff92SAndroid Build Coastguard Worker     dequantizeLayer->SetBackendId(setBackend);
75*89c4ff92SAndroid Build Coastguard Worker     ARMNN_ASSERT(dequantizeLayer != nullptr);
76*89c4ff92SAndroid Build Coastguard Worker 
77*89c4ff92SAndroid Build Coastguard Worker     armnn::IOutputSlot& outputSlot = dequantizeLayer->GetOutputSlot(0);
78*89c4ff92SAndroid Build Coastguard Worker     outputSlot.SetTensorInfo(outputTensorInfo);
79*89c4ff92SAndroid Build Coastguard Worker 
80*89c4ff92SAndroid Build Coastguard Worker     auto inputsTensorsProcess = ProcessInputs(dequantizeLayer,
81*89c4ff92SAndroid Build Coastguard Worker                                               delegateData,
82*89c4ff92SAndroid Build Coastguard Worker                                               tfLiteContext,
83*89c4ff92SAndroid Build Coastguard Worker                                               tfLiteNode);
84*89c4ff92SAndroid Build Coastguard Worker     if (inputsTensorsProcess == kTfLiteError)
85*89c4ff92SAndroid Build Coastguard Worker     {
86*89c4ff92SAndroid Build Coastguard Worker         return inputsTensorsProcess;
87*89c4ff92SAndroid Build Coastguard Worker     }
88*89c4ff92SAndroid Build Coastguard Worker 
89*89c4ff92SAndroid Build Coastguard Worker     return Connect(dequantizeLayer, tfLiteNode, delegateData);
90*89c4ff92SAndroid Build Coastguard Worker }
91*89c4ff92SAndroid Build Coastguard Worker 
VisitQuantizeOperator(DelegateData & delegateData,TfLiteContext * tfLiteContext,TfLiteNode * tfLiteNode,int nodeIndex,int32_t tfLiteQuantizeOperatorCode)92*89c4ff92SAndroid Build Coastguard Worker TfLiteStatus VisitQuantizeOperator(DelegateData& delegateData,
93*89c4ff92SAndroid Build Coastguard Worker                                    TfLiteContext* tfLiteContext,
94*89c4ff92SAndroid Build Coastguard Worker                                    TfLiteNode* tfLiteNode,
95*89c4ff92SAndroid Build Coastguard Worker                                    int nodeIndex,
96*89c4ff92SAndroid Build Coastguard Worker                                    int32_t tfLiteQuantizeOperatorCode)
97*89c4ff92SAndroid Build Coastguard Worker {
98*89c4ff92SAndroid Build Coastguard Worker     TF_LITE_ENSURE_STATUS(ValidateNumInputs(tfLiteContext, tfLiteNode, 1, nodeIndex));
99*89c4ff92SAndroid Build Coastguard Worker     TF_LITE_ENSURE_STATUS(ValidateNumOutputs(tfLiteContext, tfLiteNode, 1, nodeIndex));
100*89c4ff92SAndroid Build Coastguard Worker 
101*89c4ff92SAndroid Build Coastguard Worker     const TfLiteTensor* tfLiteTensors = tfLiteContext->tensors;
102*89c4ff92SAndroid Build Coastguard Worker     const TfLiteTensor& tfLiteInputTensor = tfLiteTensors[tfLiteNode->inputs->data[0]];
103*89c4ff92SAndroid Build Coastguard Worker     if (IsDynamicTensor(tfLiteInputTensor))
104*89c4ff92SAndroid Build Coastguard Worker     {
105*89c4ff92SAndroid Build Coastguard Worker         TF_LITE_MAYBE_KERNEL_LOG(
106*89c4ff92SAndroid Build Coastguard Worker             tfLiteContext,
107*89c4ff92SAndroid Build Coastguard Worker             "TfLiteArmnnDelegate: Dynamic input tensors are not supported in operator #%d node #%d: ",
108*89c4ff92SAndroid Build Coastguard Worker             tfLiteQuantizeOperatorCode, nodeIndex);
109*89c4ff92SAndroid Build Coastguard Worker         return kTfLiteError;
110*89c4ff92SAndroid Build Coastguard Worker     }
111*89c4ff92SAndroid Build Coastguard Worker 
112*89c4ff92SAndroid Build Coastguard Worker     const TfLiteTensor& tfLiteOutputTensor = tfLiteTensors[tfLiteNode->outputs->data[0]];
113*89c4ff92SAndroid Build Coastguard Worker     if (IsDynamicTensor(tfLiteOutputTensor))
114*89c4ff92SAndroid Build Coastguard Worker     {
115*89c4ff92SAndroid Build Coastguard Worker         TF_LITE_MAYBE_KERNEL_LOG(
116*89c4ff92SAndroid Build Coastguard Worker             tfLiteContext,
117*89c4ff92SAndroid Build Coastguard Worker             "TfLiteArmnnDelegate: Dynamic output tensors are not supported in operator #%d node #%d: ",
118*89c4ff92SAndroid Build Coastguard Worker             tfLiteQuantizeOperatorCode, nodeIndex);
119*89c4ff92SAndroid Build Coastguard Worker         return kTfLiteError;
120*89c4ff92SAndroid Build Coastguard Worker     }
121*89c4ff92SAndroid Build Coastguard Worker 
122*89c4ff92SAndroid Build Coastguard Worker     // Only affine per-layer quantization is supported.
123*89c4ff92SAndroid Build Coastguard Worker     if (!IsAffineQuantization(tfLiteOutputTensor))
124*89c4ff92SAndroid Build Coastguard Worker     {
125*89c4ff92SAndroid Build Coastguard Worker         TF_LITE_MAYBE_KERNEL_LOG(
126*89c4ff92SAndroid Build Coastguard Worker             tfLiteContext,
127*89c4ff92SAndroid Build Coastguard Worker             "TfLiteArmnnDelegate: Only affine per-layer quantization is supported in operator #%d node #%d: ",
128*89c4ff92SAndroid Build Coastguard Worker             tfLiteQuantizeOperatorCode, nodeIndex);
129*89c4ff92SAndroid Build Coastguard Worker         return kTfLiteError;
130*89c4ff92SAndroid Build Coastguard Worker     }
131*89c4ff92SAndroid Build Coastguard Worker 
132*89c4ff92SAndroid Build Coastguard Worker     const armnn::TensorInfo& inputTensorInfo = GetTensorInfoForTfLiteTensor(tfLiteInputTensor);
133*89c4ff92SAndroid Build Coastguard Worker     const armnn::TensorInfo& outputTensorInfo = GetTensorInfoForTfLiteTensor(tfLiteOutputTensor, true);
134*89c4ff92SAndroid Build Coastguard Worker 
135*89c4ff92SAndroid Build Coastguard Worker     bool isSupported = false;
136*89c4ff92SAndroid Build Coastguard Worker     armnn::BackendId setBackend;
137*89c4ff92SAndroid Build Coastguard Worker     auto validateFunc = [&](const armnn::TensorInfo& outputTensorInfo, bool& isSupported)
138*89c4ff92SAndroid Build Coastguard Worker     {
139*89c4ff92SAndroid Build Coastguard Worker         FORWARD_LAYER_SUPPORT_FUNC("QUANTIZE",
140*89c4ff92SAndroid Build Coastguard Worker                                    tfLiteContext,
141*89c4ff92SAndroid Build Coastguard Worker                                    IsQuantizeSupported,
142*89c4ff92SAndroid Build Coastguard Worker                                    delegateData.m_Backends,
143*89c4ff92SAndroid Build Coastguard Worker                                    isSupported,
144*89c4ff92SAndroid Build Coastguard Worker                                    setBackend,
145*89c4ff92SAndroid Build Coastguard Worker                                    inputTensorInfo,
146*89c4ff92SAndroid Build Coastguard Worker                                    outputTensorInfo);
147*89c4ff92SAndroid Build Coastguard Worker     };
148*89c4ff92SAndroid Build Coastguard Worker 
149*89c4ff92SAndroid Build Coastguard Worker     if (!delegateData.m_Network)
150*89c4ff92SAndroid Build Coastguard Worker     {
151*89c4ff92SAndroid Build Coastguard Worker         validateFunc(outputTensorInfo, isSupported);
152*89c4ff92SAndroid Build Coastguard Worker         return isSupported ? kTfLiteOk : kTfLiteError;
153*89c4ff92SAndroid Build Coastguard Worker     }
154*89c4ff92SAndroid Build Coastguard Worker 
155*89c4ff92SAndroid Build Coastguard Worker     armnn::IConnectableLayer* quantizeLayer = delegateData.m_Network->AddQuantizeLayer();
156*89c4ff92SAndroid Build Coastguard Worker     quantizeLayer->SetBackendId(setBackend);
157*89c4ff92SAndroid Build Coastguard Worker     ARMNN_ASSERT(quantizeLayer != nullptr);
158*89c4ff92SAndroid Build Coastguard Worker 
159*89c4ff92SAndroid Build Coastguard Worker     armnn::IOutputSlot& outputSlot = quantizeLayer->GetOutputSlot(0);
160*89c4ff92SAndroid Build Coastguard Worker     outputSlot.SetTensorInfo(outputTensorInfo);
161*89c4ff92SAndroid Build Coastguard Worker 
162*89c4ff92SAndroid Build Coastguard Worker     // try to connect the Constant Inputs if there are any
163*89c4ff92SAndroid Build Coastguard Worker     if(ProcessInputs(quantizeLayer,delegateData, tfLiteContext, tfLiteNode) != kTfLiteOk )
164*89c4ff92SAndroid Build Coastguard Worker     {
165*89c4ff92SAndroid Build Coastguard Worker         return kTfLiteError;
166*89c4ff92SAndroid Build Coastguard Worker     }
167*89c4ff92SAndroid Build Coastguard Worker 
168*89c4ff92SAndroid Build Coastguard Worker     return Connect(quantizeLayer, tfLiteNode, delegateData);
169*89c4ff92SAndroid Build Coastguard Worker }
170*89c4ff92SAndroid Build Coastguard Worker 
171*89c4ff92SAndroid Build Coastguard Worker } // namespace armnnDelegate
172