xref: /aosp_15_r20/external/libhevc/common/ihevc_itrans_recon.c (revision c83a76b084498d55f252f48b2e3786804cdf24b7)
1*c83a76b0SSuyog Pawar /******************************************************************************
2*c83a76b0SSuyog Pawar *
3*c83a76b0SSuyog Pawar * Copyright (C) 2012 Ittiam Systems Pvt Ltd, Bangalore
4*c83a76b0SSuyog Pawar *
5*c83a76b0SSuyog Pawar * Licensed under the Apache License, Version 2.0 (the "License");
6*c83a76b0SSuyog Pawar * you may not use this file except in compliance with the License.
7*c83a76b0SSuyog Pawar * You may obtain a copy of the License at:
8*c83a76b0SSuyog Pawar *
9*c83a76b0SSuyog Pawar * http://www.apache.org/licenses/LICENSE-2.0
10*c83a76b0SSuyog Pawar *
11*c83a76b0SSuyog Pawar * Unless required by applicable law or agreed to in writing, software
12*c83a76b0SSuyog Pawar * distributed under the License is distributed on an "AS IS" BASIS,
13*c83a76b0SSuyog Pawar * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14*c83a76b0SSuyog Pawar * See the License for the specific language governing permissions and
15*c83a76b0SSuyog Pawar * limitations under the License.
16*c83a76b0SSuyog Pawar *
17*c83a76b0SSuyog Pawar ******************************************************************************/
18*c83a76b0SSuyog Pawar /**
19*c83a76b0SSuyog Pawar  *******************************************************************************
20*c83a76b0SSuyog Pawar  * @file
21*c83a76b0SSuyog Pawar  *  ihevc_itrans_recon.c
22*c83a76b0SSuyog Pawar  *
23*c83a76b0SSuyog Pawar  * @brief
24*c83a76b0SSuyog Pawar  *  Contains function definitions for inverse transform  and reconstruction
25*c83a76b0SSuyog Pawar  *
26*c83a76b0SSuyog Pawar  *
27*c83a76b0SSuyog Pawar  * @author
28*c83a76b0SSuyog Pawar  *  100470
29*c83a76b0SSuyog Pawar  *
30*c83a76b0SSuyog Pawar  * @par List of Functions:
31*c83a76b0SSuyog Pawar  *  - ihevc_itrans_recon_4x4_ttype1()
32*c83a76b0SSuyog Pawar  *  - ihevc_itrans_recon_4x4()
33*c83a76b0SSuyog Pawar  *
34*c83a76b0SSuyog Pawar  * @remarks
35*c83a76b0SSuyog Pawar  *  None
36*c83a76b0SSuyog Pawar  *
37*c83a76b0SSuyog Pawar  *******************************************************************************
38*c83a76b0SSuyog Pawar  */
39*c83a76b0SSuyog Pawar #include <stdio.h>
40*c83a76b0SSuyog Pawar #include <string.h>
41*c83a76b0SSuyog Pawar #include "ihevc_typedefs.h"
42*c83a76b0SSuyog Pawar #include "ihevc_macros.h"
43*c83a76b0SSuyog Pawar #include "ihevc_platform_macros.h"
44*c83a76b0SSuyog Pawar #include "ihevc_defs.h"
45*c83a76b0SSuyog Pawar #include "ihevc_trans_tables.h"
46*c83a76b0SSuyog Pawar #include "ihevc_itrans_recon.h"
47*c83a76b0SSuyog Pawar #include "ihevc_func_selector.h"
48*c83a76b0SSuyog Pawar #include "ihevc_trans_macros.h"
49*c83a76b0SSuyog Pawar 
50*c83a76b0SSuyog Pawar /* All the functions here are replicated from ihevc_itrans.c and modified to */
51*c83a76b0SSuyog Pawar /* include reconstruction */
52*c83a76b0SSuyog Pawar 
53*c83a76b0SSuyog Pawar /**
54*c83a76b0SSuyog Pawar  *******************************************************************************
55*c83a76b0SSuyog Pawar  *
56*c83a76b0SSuyog Pawar  * @brief
57*c83a76b0SSuyog Pawar  *  This function performs Inverse transform type 1 (DST)  and reconstruction
58*c83a76b0SSuyog Pawar  * for 4x4 input block
59*c83a76b0SSuyog Pawar  *
60*c83a76b0SSuyog Pawar  * @par Description:
61*c83a76b0SSuyog Pawar  *  Performs inverse transform and adds the prediction  data and clips output
62*c83a76b0SSuyog Pawar  * to 8 bit
63*c83a76b0SSuyog Pawar  *
64*c83a76b0SSuyog Pawar  * @param[in] pi2_src
65*c83a76b0SSuyog Pawar  *  Input 4x4 coefficients
66*c83a76b0SSuyog Pawar  *
67*c83a76b0SSuyog Pawar  * @param[in] pi2_tmp
68*c83a76b0SSuyog Pawar  *  Temporary 4x4 buffer for storing inverse
69*c83a76b0SSuyog Pawar  *
70*c83a76b0SSuyog Pawar  *  transform
71*c83a76b0SSuyog Pawar  *  1st stage output
72*c83a76b0SSuyog Pawar  *
73*c83a76b0SSuyog Pawar  * @param[in] pu1_pred
74*c83a76b0SSuyog Pawar  *  Prediction 4x4 block
75*c83a76b0SSuyog Pawar  *
76*c83a76b0SSuyog Pawar  * @param[out] pu1_dst
77*c83a76b0SSuyog Pawar  *  Output 4x4 block
78*c83a76b0SSuyog Pawar  *
79*c83a76b0SSuyog Pawar  * @param[in] src_strd
80*c83a76b0SSuyog Pawar  *  Input stride
81*c83a76b0SSuyog Pawar  *
82*c83a76b0SSuyog Pawar  * @param[in] pred_strd
83*c83a76b0SSuyog Pawar  *  Prediction stride
84*c83a76b0SSuyog Pawar  *
85*c83a76b0SSuyog Pawar  * @param[in] dst_strd
86*c83a76b0SSuyog Pawar  *  Output Stride
87*c83a76b0SSuyog Pawar  *
88*c83a76b0SSuyog Pawar  * @param[in] zero_cols
89*c83a76b0SSuyog Pawar  *  Zero columns in pi2_src
90*c83a76b0SSuyog Pawar  *
91*c83a76b0SSuyog Pawar  * @returns  Void
92*c83a76b0SSuyog Pawar  *
93*c83a76b0SSuyog Pawar  * @remarks
94*c83a76b0SSuyog Pawar  *  None
95*c83a76b0SSuyog Pawar  *
96*c83a76b0SSuyog Pawar  *******************************************************************************
97*c83a76b0SSuyog Pawar  */
98*c83a76b0SSuyog Pawar 
ihevc_itrans_recon_4x4_ttype1(WORD16 * pi2_src,WORD16 * pi2_tmp,UWORD8 * pu1_pred,UWORD8 * pu1_dst,WORD32 src_strd,WORD32 pred_strd,WORD32 dst_strd,WORD32 zero_cols,WORD32 zero_rows)99*c83a76b0SSuyog Pawar void ihevc_itrans_recon_4x4_ttype1(WORD16 *pi2_src,
100*c83a76b0SSuyog Pawar                                    WORD16 *pi2_tmp,
101*c83a76b0SSuyog Pawar                                    UWORD8 *pu1_pred,
102*c83a76b0SSuyog Pawar                                    UWORD8 *pu1_dst,
103*c83a76b0SSuyog Pawar                                    WORD32 src_strd,
104*c83a76b0SSuyog Pawar                                    WORD32 pred_strd,
105*c83a76b0SSuyog Pawar                                    WORD32 dst_strd,
106*c83a76b0SSuyog Pawar                                    WORD32 zero_cols,
107*c83a76b0SSuyog Pawar                                    WORD32 zero_rows)
108*c83a76b0SSuyog Pawar {
109*c83a76b0SSuyog Pawar     WORD32 i, c[4];
110*c83a76b0SSuyog Pawar     WORD32 add;
111*c83a76b0SSuyog Pawar     WORD32 shift;
112*c83a76b0SSuyog Pawar     WORD16 *pi2_tmp_orig;
113*c83a76b0SSuyog Pawar     WORD32 trans_size;
114*c83a76b0SSuyog Pawar     UNUSED(zero_rows);
115*c83a76b0SSuyog Pawar     trans_size = TRANS_SIZE_4;
116*c83a76b0SSuyog Pawar 
117*c83a76b0SSuyog Pawar     pi2_tmp_orig = pi2_tmp;
118*c83a76b0SSuyog Pawar 
119*c83a76b0SSuyog Pawar     /* Inverse Transform 1st stage */
120*c83a76b0SSuyog Pawar     shift = IT_SHIFT_STAGE_1;
121*c83a76b0SSuyog Pawar     add = 1 << (shift - 1);
122*c83a76b0SSuyog Pawar 
123*c83a76b0SSuyog Pawar     for(i = 0; i < trans_size; i++)
124*c83a76b0SSuyog Pawar     {
125*c83a76b0SSuyog Pawar         /* Checking for Zero Cols */
126*c83a76b0SSuyog Pawar         if((zero_cols & 1) == 1)
127*c83a76b0SSuyog Pawar         {
128*c83a76b0SSuyog Pawar             memset(pi2_tmp, 0, trans_size * sizeof(WORD16));
129*c83a76b0SSuyog Pawar         }
130*c83a76b0SSuyog Pawar         else
131*c83a76b0SSuyog Pawar         {
132*c83a76b0SSuyog Pawar             // Intermediate Variables
133*c83a76b0SSuyog Pawar             c[0] = pi2_src[0] + pi2_src[2 * src_strd];
134*c83a76b0SSuyog Pawar             c[1] = pi2_src[2 * src_strd] + pi2_src[3 * src_strd];
135*c83a76b0SSuyog Pawar             c[2] = pi2_src[0] - pi2_src[3 * src_strd];
136*c83a76b0SSuyog Pawar             c[3] = 74 * pi2_src[src_strd];
137*c83a76b0SSuyog Pawar 
138*c83a76b0SSuyog Pawar             pi2_tmp[0] =
139*c83a76b0SSuyog Pawar                             CLIP_S16((29 * c[0] + 55 * c[1] + c[3] + add) >> shift);
140*c83a76b0SSuyog Pawar             pi2_tmp[1] =
141*c83a76b0SSuyog Pawar                             CLIP_S16((55 * c[2] - 29 * c[1] + c[3] + add) >> shift);
142*c83a76b0SSuyog Pawar             pi2_tmp[2] =
143*c83a76b0SSuyog Pawar                             CLIP_S16((74 * (pi2_src[0] - pi2_src[2 * src_strd] + pi2_src[3 * src_strd]) + add) >> shift);
144*c83a76b0SSuyog Pawar             pi2_tmp[3] =
145*c83a76b0SSuyog Pawar                             CLIP_S16((55 * c[0] + 29 * c[2] - c[3] + add) >> shift);
146*c83a76b0SSuyog Pawar         }
147*c83a76b0SSuyog Pawar         pi2_src++;
148*c83a76b0SSuyog Pawar         pi2_tmp += trans_size;
149*c83a76b0SSuyog Pawar         zero_cols = zero_cols >> 1;
150*c83a76b0SSuyog Pawar     }
151*c83a76b0SSuyog Pawar 
152*c83a76b0SSuyog Pawar     pi2_tmp = pi2_tmp_orig;
153*c83a76b0SSuyog Pawar 
154*c83a76b0SSuyog Pawar     /* Inverse Transform 2nd stage */
155*c83a76b0SSuyog Pawar     shift = IT_SHIFT_STAGE_2;
156*c83a76b0SSuyog Pawar     add = 1 << (shift - 1);
157*c83a76b0SSuyog Pawar 
158*c83a76b0SSuyog Pawar     for(i = 0; i < trans_size; i++)
159*c83a76b0SSuyog Pawar     {
160*c83a76b0SSuyog Pawar         WORD32 itrans_out;
161*c83a76b0SSuyog Pawar         // Intermediate Variables
162*c83a76b0SSuyog Pawar         c[0] = pi2_tmp[0] + pi2_tmp[2 * trans_size];
163*c83a76b0SSuyog Pawar         c[1] = pi2_tmp[2 * trans_size] + pi2_tmp[3 * trans_size];
164*c83a76b0SSuyog Pawar         c[2] = pi2_tmp[0] - pi2_tmp[3 * trans_size];
165*c83a76b0SSuyog Pawar         c[3] = 74 * pi2_tmp[trans_size];
166*c83a76b0SSuyog Pawar 
167*c83a76b0SSuyog Pawar         itrans_out =
168*c83a76b0SSuyog Pawar                         CLIP_S16((29 * c[0] + 55 * c[1] + c[3] + add) >> shift);
169*c83a76b0SSuyog Pawar         pu1_dst[0] = CLIP_U8((itrans_out + pu1_pred[0]));
170*c83a76b0SSuyog Pawar         itrans_out =
171*c83a76b0SSuyog Pawar                         CLIP_S16((55 * c[2] - 29 * c[1] + c[3] + add) >> shift);
172*c83a76b0SSuyog Pawar         pu1_dst[1] = CLIP_U8((itrans_out + pu1_pred[1]));
173*c83a76b0SSuyog Pawar         itrans_out =
174*c83a76b0SSuyog Pawar                         CLIP_S16((74 * (pi2_tmp[0] - pi2_tmp[2 * trans_size] + pi2_tmp[3 * trans_size]) + add) >> shift);
175*c83a76b0SSuyog Pawar         pu1_dst[2] = CLIP_U8((itrans_out + pu1_pred[2]));
176*c83a76b0SSuyog Pawar         itrans_out =
177*c83a76b0SSuyog Pawar                         CLIP_S16((55 * c[0] + 29 * c[2] - c[3] + add) >> shift);
178*c83a76b0SSuyog Pawar         pu1_dst[3] = CLIP_U8((itrans_out + pu1_pred[3]));
179*c83a76b0SSuyog Pawar         pi2_tmp++;
180*c83a76b0SSuyog Pawar         pu1_pred += pred_strd;
181*c83a76b0SSuyog Pawar         pu1_dst += dst_strd;
182*c83a76b0SSuyog Pawar     }
183*c83a76b0SSuyog Pawar }
184*c83a76b0SSuyog Pawar 
185*c83a76b0SSuyog Pawar /**
186*c83a76b0SSuyog Pawar  *******************************************************************************
187*c83a76b0SSuyog Pawar  *
188*c83a76b0SSuyog Pawar  * @brief
189*c83a76b0SSuyog Pawar  *  This function performs Inverse transform  and reconstruction for 4x4
190*c83a76b0SSuyog Pawar  * input block
191*c83a76b0SSuyog Pawar  *
192*c83a76b0SSuyog Pawar  * @par Description:
193*c83a76b0SSuyog Pawar  *  Performs inverse transform and adds the prediction  data and clips output
194*c83a76b0SSuyog Pawar  * to 8 bit
195*c83a76b0SSuyog Pawar  *
196*c83a76b0SSuyog Pawar  * @param[in] pi2_src
197*c83a76b0SSuyog Pawar  *  Input 4x4 coefficients
198*c83a76b0SSuyog Pawar  *
199*c83a76b0SSuyog Pawar  * @param[in] pi2_tmp
200*c83a76b0SSuyog Pawar  *  Temporary 4x4 buffer for storing inverse
201*c83a76b0SSuyog Pawar  *
202*c83a76b0SSuyog Pawar  *  transform
203*c83a76b0SSuyog Pawar  *  1st stage output
204*c83a76b0SSuyog Pawar  *
205*c83a76b0SSuyog Pawar  * @param[in] pu1_pred
206*c83a76b0SSuyog Pawar  *  Prediction 4x4 block
207*c83a76b0SSuyog Pawar  *
208*c83a76b0SSuyog Pawar  * @param[out] pu1_dst
209*c83a76b0SSuyog Pawar  *  Output 4x4 block
210*c83a76b0SSuyog Pawar  *
211*c83a76b0SSuyog Pawar  * @param[in] src_strd
212*c83a76b0SSuyog Pawar  *  Input stride
213*c83a76b0SSuyog Pawar  *
214*c83a76b0SSuyog Pawar  * @param[in] pred_strd
215*c83a76b0SSuyog Pawar  *  Prediction stride
216*c83a76b0SSuyog Pawar  *
217*c83a76b0SSuyog Pawar  * @param[in] dst_strd
218*c83a76b0SSuyog Pawar  *  Output Stride
219*c83a76b0SSuyog Pawar  *
220*c83a76b0SSuyog Pawar  * @param[in] shift
221*c83a76b0SSuyog Pawar  *  Output shift
222*c83a76b0SSuyog Pawar  *
223*c83a76b0SSuyog Pawar  * @param[in] zero_cols
224*c83a76b0SSuyog Pawar  *  Zero columns in pi2_src
225*c83a76b0SSuyog Pawar  *
226*c83a76b0SSuyog Pawar  * @returns  Void
227*c83a76b0SSuyog Pawar  *
228*c83a76b0SSuyog Pawar  * @remarks
229*c83a76b0SSuyog Pawar  *  None
230*c83a76b0SSuyog Pawar  *
231*c83a76b0SSuyog Pawar  *******************************************************************************
232*c83a76b0SSuyog Pawar  */
233*c83a76b0SSuyog Pawar 
ihevc_itrans_recon_4x4(WORD16 * pi2_src,WORD16 * pi2_tmp,UWORD8 * pu1_pred,UWORD8 * pu1_dst,WORD32 src_strd,WORD32 pred_strd,WORD32 dst_strd,WORD32 zero_cols,WORD32 zero_rows)234*c83a76b0SSuyog Pawar void ihevc_itrans_recon_4x4(WORD16 *pi2_src,
235*c83a76b0SSuyog Pawar                             WORD16 *pi2_tmp,
236*c83a76b0SSuyog Pawar                             UWORD8 *pu1_pred,
237*c83a76b0SSuyog Pawar                             UWORD8 *pu1_dst,
238*c83a76b0SSuyog Pawar                             WORD32 src_strd,
239*c83a76b0SSuyog Pawar                             WORD32 pred_strd,
240*c83a76b0SSuyog Pawar                             WORD32 dst_strd,
241*c83a76b0SSuyog Pawar                             WORD32 zero_cols,
242*c83a76b0SSuyog Pawar                             WORD32 zero_rows)
243*c83a76b0SSuyog Pawar 
244*c83a76b0SSuyog Pawar {
245*c83a76b0SSuyog Pawar     WORD32 j;
246*c83a76b0SSuyog Pawar     WORD32 e[2], o[2];
247*c83a76b0SSuyog Pawar     WORD32 add;
248*c83a76b0SSuyog Pawar     WORD32 shift;
249*c83a76b0SSuyog Pawar     WORD16 *pi2_tmp_orig;
250*c83a76b0SSuyog Pawar     WORD32 trans_size;
251*c83a76b0SSuyog Pawar     UNUSED(zero_rows);
252*c83a76b0SSuyog Pawar     trans_size = TRANS_SIZE_4;
253*c83a76b0SSuyog Pawar 
254*c83a76b0SSuyog Pawar     pi2_tmp_orig = pi2_tmp;
255*c83a76b0SSuyog Pawar 
256*c83a76b0SSuyog Pawar     /* Inverse Transform 1st stage */
257*c83a76b0SSuyog Pawar     shift = IT_SHIFT_STAGE_1;
258*c83a76b0SSuyog Pawar     add = 1 << (shift - 1);
259*c83a76b0SSuyog Pawar 
260*c83a76b0SSuyog Pawar     for(j = 0; j < trans_size; j++)
261*c83a76b0SSuyog Pawar     {
262*c83a76b0SSuyog Pawar         /* Checking for Zero Cols */
263*c83a76b0SSuyog Pawar         if((zero_cols & 1) == 1)
264*c83a76b0SSuyog Pawar         {
265*c83a76b0SSuyog Pawar             memset(pi2_tmp, 0, trans_size * sizeof(WORD16));
266*c83a76b0SSuyog Pawar         }
267*c83a76b0SSuyog Pawar         else
268*c83a76b0SSuyog Pawar         {
269*c83a76b0SSuyog Pawar 
270*c83a76b0SSuyog Pawar             /* Utilizing symmetry properties to the maximum to minimize the number of multiplications */
271*c83a76b0SSuyog Pawar             o[0] = g_ai2_ihevc_trans_4[1][0] * pi2_src[src_strd]
272*c83a76b0SSuyog Pawar                             + g_ai2_ihevc_trans_4[3][0] * pi2_src[3 * src_strd];
273*c83a76b0SSuyog Pawar             o[1] = g_ai2_ihevc_trans_4[1][1] * pi2_src[src_strd]
274*c83a76b0SSuyog Pawar                             + g_ai2_ihevc_trans_4[3][1] * pi2_src[3 * src_strd];
275*c83a76b0SSuyog Pawar             e[0] = g_ai2_ihevc_trans_4[0][0] * pi2_src[0]
276*c83a76b0SSuyog Pawar                             + g_ai2_ihevc_trans_4[2][0] * pi2_src[2 * src_strd];
277*c83a76b0SSuyog Pawar             e[1] = g_ai2_ihevc_trans_4[0][1] * pi2_src[0]
278*c83a76b0SSuyog Pawar                             + g_ai2_ihevc_trans_4[2][1] * pi2_src[2 * src_strd];
279*c83a76b0SSuyog Pawar 
280*c83a76b0SSuyog Pawar             pi2_tmp[0] =
281*c83a76b0SSuyog Pawar                             CLIP_S16(((e[0] + o[0] + add) >> shift));
282*c83a76b0SSuyog Pawar             pi2_tmp[1] =
283*c83a76b0SSuyog Pawar                             CLIP_S16(((e[1] + o[1] + add) >> shift));
284*c83a76b0SSuyog Pawar             pi2_tmp[2] =
285*c83a76b0SSuyog Pawar                             CLIP_S16(((e[1] - o[1] + add) >> shift));
286*c83a76b0SSuyog Pawar             pi2_tmp[3] =
287*c83a76b0SSuyog Pawar                             CLIP_S16(((e[0] - o[0] + add) >> shift));
288*c83a76b0SSuyog Pawar 
289*c83a76b0SSuyog Pawar         }
290*c83a76b0SSuyog Pawar         pi2_src++;
291*c83a76b0SSuyog Pawar         pi2_tmp += trans_size;
292*c83a76b0SSuyog Pawar         zero_cols = zero_cols >> 1;
293*c83a76b0SSuyog Pawar     }
294*c83a76b0SSuyog Pawar 
295*c83a76b0SSuyog Pawar     pi2_tmp = pi2_tmp_orig;
296*c83a76b0SSuyog Pawar 
297*c83a76b0SSuyog Pawar     /* Inverse Transform 2nd stage */
298*c83a76b0SSuyog Pawar     shift = IT_SHIFT_STAGE_2;
299*c83a76b0SSuyog Pawar     add = 1 << (shift - 1);
300*c83a76b0SSuyog Pawar 
301*c83a76b0SSuyog Pawar     for(j = 0; j < trans_size; j++)
302*c83a76b0SSuyog Pawar     {
303*c83a76b0SSuyog Pawar         WORD32 itrans_out;
304*c83a76b0SSuyog Pawar         /* Utilizing symmetry properties to the maximum to minimize the number of multiplications */
305*c83a76b0SSuyog Pawar         o[0] = g_ai2_ihevc_trans_4[1][0] * pi2_tmp[trans_size]
306*c83a76b0SSuyog Pawar                         + g_ai2_ihevc_trans_4[3][0] * pi2_tmp[3 * trans_size];
307*c83a76b0SSuyog Pawar         o[1] = g_ai2_ihevc_trans_4[1][1] * pi2_tmp[trans_size]
308*c83a76b0SSuyog Pawar                         + g_ai2_ihevc_trans_4[3][1] * pi2_tmp[3 * trans_size];
309*c83a76b0SSuyog Pawar         e[0] = g_ai2_ihevc_trans_4[0][0] * pi2_tmp[0]
310*c83a76b0SSuyog Pawar                         + g_ai2_ihevc_trans_4[2][0] * pi2_tmp[2 * trans_size];
311*c83a76b0SSuyog Pawar         e[1] = g_ai2_ihevc_trans_4[0][1] * pi2_tmp[0]
312*c83a76b0SSuyog Pawar                         + g_ai2_ihevc_trans_4[2][1] * pi2_tmp[2 * trans_size];
313*c83a76b0SSuyog Pawar 
314*c83a76b0SSuyog Pawar         itrans_out =
315*c83a76b0SSuyog Pawar                         CLIP_S16(((e[0] + o[0] + add) >> shift));
316*c83a76b0SSuyog Pawar         pu1_dst[0] = CLIP_U8((itrans_out + pu1_pred[0]));
317*c83a76b0SSuyog Pawar         itrans_out =
318*c83a76b0SSuyog Pawar                         CLIP_S16(((e[1] + o[1] + add) >> shift));
319*c83a76b0SSuyog Pawar         pu1_dst[1] = CLIP_U8((itrans_out + pu1_pred[1]));
320*c83a76b0SSuyog Pawar         itrans_out =
321*c83a76b0SSuyog Pawar                         CLIP_S16(((e[1] - o[1] + add) >> shift));
322*c83a76b0SSuyog Pawar         pu1_dst[2] = CLIP_U8((itrans_out + pu1_pred[2]));
323*c83a76b0SSuyog Pawar         itrans_out =
324*c83a76b0SSuyog Pawar                         CLIP_S16(((e[0] - o[0] + add) >> shift));
325*c83a76b0SSuyog Pawar         pu1_dst[3] = CLIP_U8((itrans_out + pu1_pred[3]));
326*c83a76b0SSuyog Pawar 
327*c83a76b0SSuyog Pawar         pi2_tmp++;
328*c83a76b0SSuyog Pawar         pu1_pred += pred_strd;
329*c83a76b0SSuyog Pawar         pu1_dst += dst_strd;
330*c83a76b0SSuyog Pawar 
331*c83a76b0SSuyog Pawar     }
332*c83a76b0SSuyog Pawar }
333*c83a76b0SSuyog Pawar 
334