1 /******************************************************************************
2  *
3  * Copyright (C) 2015 The Android Open Source Project
4  *
5  * Licensed under the Apache License, Version 2.0 (the "License");
6  * you may not use this file except in compliance with the License.
7  * You may obtain a copy of the License at:
8  *
9  * http://www.apache.org/licenses/LICENSE-2.0
10  *
11  * Unless required by applicable law or agreed to in writing, software
12  * distributed under the License is distributed on an "AS IS" BASIS,
13  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14  * See the License for the specific language governing permissions and
15  * limitations under the License.
16  *
17  *****************************************************************************
18  * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore
19 */
20 /**
21  *******************************************************************************
22  * @file
23  *  ih264_ihadamard_scaling.c
24  *
25  * @brief
26  *  Contains definition of functions for h264 inverse hadamard 4x4 transform and scaling
27  *
28  * @author
29  *  Mohit
30  *
31  *  @par List of Functions:
32  *  - ih264_ihadamard_scaling_4x4()
33  *
34  * @remarks
35  *
36  *******************************************************************************
37  */
38 
39 /*****************************************************************************/
40 /* File Includes                                                             */
41 /*****************************************************************************/
42 
43 /* User include files */
44 #include "ih264_typedefs.h"
45 #include "ih264_defs.h"
46 #include "ih264_trans_macros.h"
47 #include "ih264_macros.h"
48 #include "ih264_trans_data.h"
49 #include "ih264_size_defs.h"
50 #include "ih264_structs.h"
51 #include "ih264_trans_quant_itrans_iquant.h"
52 
53 /*
54  ********************************************************************************
55  *
56  * @brief This function performs a 4x4 inverse hadamard transform on the 4x4 DC coefficients
57  * of a 16x16 intra prediction macroblock, and then performs scaling.
58  * prediction buffer
59  *
60  * @par Description:
61  *  The DC coefficients pass through a 2-stage inverse hadamard transform.
62  *  This inverse transformed content is scaled to based on Qp value.
63  *
64  * @param[in] pi2_src
65  *  input 4x4 block of DC coefficients
66  *
67  * @param[out] pi2_out
68  *  output 4x4 block
69  *
70  * @param[in] pu2_iscal_mat
71  *  pointer to scaling list
72  *
73  * @param[in] pu2_weigh_mat
74  *  pointer to weight matrix
75  *
76  * @param[in] u4_qp_div_6
77  *  Floor (qp/6)
78  *
79  * @param[in] pi4_tmp
80  * temporary buffer of size 1*16
81  *
82  * @returns none
83  *
84  * @remarks none
85  *
86  *******************************************************************************
87  */
ih264_ihadamard_scaling_4x4(WORD16 * pi2_src,WORD16 * pi2_out,const UWORD16 * pu2_iscal_mat,const UWORD16 * pu2_weigh_mat,UWORD32 u4_qp_div_6,WORD32 * pi4_tmp)88 void ih264_ihadamard_scaling_4x4(WORD16* pi2_src,
89                                  WORD16* pi2_out,
90                                  const UWORD16 *pu2_iscal_mat,
91                                  const UWORD16 *pu2_weigh_mat,
92                                  UWORD32 u4_qp_div_6,
93                                  WORD32* pi4_tmp)
94 {
95     WORD32 i;
96     WORD32 x0, x1, x2, x3, x4, x5, x6, x7;
97     WORD16* pi2_src_ptr, *pi2_out_ptr;
98     WORD32* pi4_tmp_ptr;
99     WORD32 rnd_fact = (u4_qp_div_6 < 6) ? (1 << (5 - u4_qp_div_6)) : 0;
100     pi4_tmp_ptr = pi4_tmp;
101     pi2_src_ptr = pi2_src;
102     pi2_out_ptr = pi2_out;
103     // Horizontal transform
104     for(i = 0; i < SUB_BLK_WIDTH_4x4; i++)
105     {
106         x4 = pi2_src_ptr[0];
107         x5 = pi2_src_ptr[1];
108         x6 = pi2_src_ptr[2];
109         x7 = pi2_src_ptr[3];
110 
111         x0 = x4 + x7;
112         x1 = x5 + x6;
113         x2 = x5 - x6;
114         x3 = x4 - x7;
115 
116         pi4_tmp_ptr[0] = x0 + x1;
117         pi4_tmp_ptr[1] = x2 + x3;
118         pi4_tmp_ptr[2] = x0 - x1;
119         pi4_tmp_ptr[3] = x3 - x2;
120 
121         pi4_tmp_ptr += SUB_BLK_WIDTH_4x4;
122         pi2_src_ptr += SUB_BLK_WIDTH_4x4;
123     }
124     pi4_tmp_ptr = pi4_tmp;
125     // Vertical Transform
126     for(i = 0; i < SUB_BLK_WIDTH_4x4; i++)
127     {
128         x4 = pi4_tmp_ptr[0];
129         x5 = pi4_tmp_ptr[4];
130         x6 = pi4_tmp_ptr[8];
131         x7 = pi4_tmp_ptr[12];
132 
133         x0 = x4 + x7;
134         x1 = x5 + x6;
135         x2 = x5 - x6;
136         x3 = x4 - x7;
137 
138         pi4_tmp_ptr[0] = x0 + x1;
139         pi4_tmp_ptr[4] = x2 + x3;
140         pi4_tmp_ptr[8] = x0 - x1;
141         pi4_tmp_ptr[12] = x3 - x2;
142 
143         pi4_tmp_ptr++;
144     }
145     pi4_tmp_ptr = pi4_tmp;
146     //Scaling
147     for(i = 0; i < (SUB_BLK_WIDTH_4x4 * SUB_BLK_WIDTH_4x4); i++)
148     {
149       INV_QUANT(pi4_tmp_ptr[i], pu2_iscal_mat[0], pu2_weigh_mat[0], u4_qp_div_6,
150                 rnd_fact, 6);
151       pi2_out_ptr[i] = pi4_tmp_ptr[i];
152     }
153 }
154 
ih264_ihadamard_scaling_2x2_uv(WORD16 * pi2_src,WORD16 * pi2_out,const UWORD16 * pu2_iscal_mat,const UWORD16 * pu2_weigh_mat,UWORD32 u4_qp_div_6,WORD32 * pi4_tmp)155 void ih264_ihadamard_scaling_2x2_uv(WORD16* pi2_src,
156                                     WORD16* pi2_out,
157                                     const UWORD16 *pu2_iscal_mat,
158                                     const UWORD16 *pu2_weigh_mat,
159                                     UWORD32 u4_qp_div_6,
160                                     WORD32* pi4_tmp)
161 {
162   WORD32 i4_x0,i4_x1,i4_x2,i4_x3,i4_x4,i4_x5,i4_x6,i4_x7;
163   WORD32 i4_y0,i4_y1,i4_y2,i4_y3,i4_y4,i4_y5,i4_y6,i4_y7;
164 
165   UNUSED(pi4_tmp);
166 
167   i4_x4 = pi2_src[0];
168   i4_x5 = pi2_src[1];
169   i4_x6 = pi2_src[2];
170   i4_x7 = pi2_src[3];
171 
172   i4_x0 = i4_x4 + i4_x5;
173   i4_x1 = i4_x4 - i4_x5;
174   i4_x2 = i4_x6 + i4_x7;
175   i4_x3 = i4_x6 - i4_x7;
176 
177   i4_x4 = i4_x0+i4_x2;
178   i4_x5 = i4_x1+i4_x3;
179   i4_x6 = i4_x0-i4_x2;
180   i4_x7 = i4_x1-i4_x3;
181 
182   INV_QUANT(i4_x4,pu2_iscal_mat[0],pu2_weigh_mat[0],u4_qp_div_6,0,5);
183   INV_QUANT(i4_x5,pu2_iscal_mat[0],pu2_weigh_mat[0],u4_qp_div_6,0,5);
184   INV_QUANT(i4_x6,pu2_iscal_mat[0],pu2_weigh_mat[0],u4_qp_div_6,0,5);
185   INV_QUANT(i4_x7,pu2_iscal_mat[0],pu2_weigh_mat[0],u4_qp_div_6,0,5);
186 
187   pi2_out[0] = i4_x4;
188   pi2_out[1] = i4_x5;
189   pi2_out[2] = i4_x6;
190   pi2_out[3] = i4_x7;
191 
192   i4_y4 = pi2_src[4];
193   i4_y5 = pi2_src[5];
194   i4_y6 = pi2_src[6];
195   i4_y7 = pi2_src[7];
196 
197   i4_y0 = i4_y4 + i4_y5;
198   i4_y1 = i4_y4 - i4_y5;
199   i4_y2 = i4_y6 + i4_y7;
200   i4_y3 = i4_y6 - i4_y7;
201 
202   i4_y4 = i4_y0+i4_y2;
203   i4_y5 = i4_y1+i4_y3;
204   i4_y6 = i4_y0-i4_y2;
205   i4_y7 = i4_y1-i4_y3;
206 
207   INV_QUANT(i4_y4,pu2_iscal_mat[0],pu2_weigh_mat[0],u4_qp_div_6,0,5);
208   INV_QUANT(i4_y5,pu2_iscal_mat[0],pu2_weigh_mat[0],u4_qp_div_6,0,5);
209   INV_QUANT(i4_y6,pu2_iscal_mat[0],pu2_weigh_mat[0],u4_qp_div_6,0,5);
210   INV_QUANT(i4_y7,pu2_iscal_mat[0],pu2_weigh_mat[0],u4_qp_div_6,0,5);
211 
212   pi2_out[4] = i4_y4;
213   pi2_out[5] = i4_y5;
214   pi2_out[6] = i4_y6;
215   pi2_out[7] = i4_y7;
216 }
217