1 /*
2  *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
3  *
4  *  Use of this source code is governed by a BSD-style license
5  *  that can be found in the LICENSE file in the root of the source
6  *  tree. An additional intellectual property rights grant can be found
7  *  in the file PATENTS.  All contributing project authors may
8  *  be found in the AUTHORS file in the root of the source tree.
9  */
10 
11 #ifndef VP9_COMMON_VP9_IDCT_H_
12 #define VP9_COMMON_VP9_IDCT_H_
13 
14 #include <assert.h>
15 
16 #include "./vpx_config.h"
17 #include "vpx/vpx_integer.h"
18 #include "vp9/common/vp9_common.h"
19 #include "vp9/common/vp9_enums.h"
20 
21 #ifdef __cplusplus
22 extern "C" {
23 #endif
24 
25 
// Fixed-point parameters and helper macros shared by the idct/dct functions.

// Shift count applied by dct_const_round_shift(). 1 << 14 == 16384, which is
// the scale factor of the cospi_*/sinpi_* tables in this header.
#define DCT_CONST_BITS 14
// Half of (1 << DCT_CONST_BITS), i.e. 8192.
#define DCT_CONST_ROUNDING (1 << (DCT_CONST_BITS - 1))

// UNIT_QUANT_FACTOR is 1 << UNIT_QUANT_SHIFT, i.e. 4.
#define UNIT_QUANT_SHIFT 2
#define UNIT_QUANT_FACTOR (1 << UNIT_QUANT_SHIFT)

// Wrappers around the SSE2 intrinsic _mm_set_epi16, which lists its eight
// 16-bit elements from the most significant lane down to the least.
// No intrinsics header is included directly by this file, so code using these
// macros must have _mm_set_epi16 declared already.

// Alternating pattern: lanes 0..7 hold a, b, a, b, a, b, a, b.
#define pair_set_epi16(a, b) _mm_set_epi16(b, a, b, a, b, a, b, a)

// Split pattern: lanes 0..3 hold a, lanes 4..7 hold b.
#define dual_set_epi16(a, b) _mm_set_epi16(b, b, b, b, a, a, a, a)
38 
// Cosine table: cospi_<i>_64 == round(16384 * cos(i * Pi / 64)) for i in
// 1..31. The values can be regenerated with:
//  for (int i = 1; i < 32; ++i)
//    printf("static const int cospi_%d_64 = %.0f;\n", i,
//           round(16384 * cos(i*M_PI/64)));
// Sines come from the same table, since sin(k*Pi/64) = cos((32-k)*Pi/64).
static const int cospi_1_64 = 16364;
static const int cospi_2_64 = 16305;
static const int cospi_3_64 = 16207;
static const int cospi_4_64 = 16069;
static const int cospi_5_64 = 15893;
static const int cospi_6_64 = 15679;
static const int cospi_7_64 = 15426;
static const int cospi_8_64 = 15137;
static const int cospi_9_64 = 14811;
static const int cospi_10_64 = 14449;
static const int cospi_11_64 = 14053;
static const int cospi_12_64 = 13623;
static const int cospi_13_64 = 13160;
static const int cospi_14_64 = 12665;
static const int cospi_15_64 = 12140;
static const int cospi_16_64 = 11585;
static const int cospi_17_64 = 11003;
static const int cospi_18_64 = 10394;
static const int cospi_19_64 = 9760;
static const int cospi_20_64 = 9102;
static const int cospi_21_64 = 8423;
static const int cospi_22_64 = 7723;
static const int cospi_23_64 = 7005;
static const int cospi_24_64 = 6270;
static const int cospi_25_64 = 5520;
static const int cospi_26_64 = 4756;
static const int cospi_27_64 = 3981;
static const int cospi_28_64 = 3196;
static const int cospi_29_64 = 2404;
static const int cospi_30_64 = 1606;
static const int cospi_31_64 = 804;
75 
// Sine table: sinpi_<k>_9 == 16384 * sqrt(2) * sin(k * Pi / 9) * 2 / 3,
// stored as an integer, for k in 1..4.
static const int sinpi_1_9 = 5283;
static const int sinpi_2_9 = 9929;
static const int sinpi_3_9 = 13377;
static const int sinpi_4_9 = 15212;
81 
dct_const_round_shift(int input)82 static INLINE int dct_const_round_shift(int input) {
83   int rv = ROUND_POWER_OF_TWO(input, DCT_CONST_BITS);
84 #if CONFIG_COEFFICIENT_RANGE_CHECKING
85   // For valid VP9 input streams, intermediate stage coefficients should always
86   // stay within the range of a signed 16 bit integer. Coefficients can go out
87   // of this range for invalid/corrupt VP9 streams. However, strictly checking
88   // this range for every intermediate coefficient can burdensome for a decoder,
89   // therefore the following assertion is only enabled when configured with
90   // --enable-coefficient-range-checking.
91   assert(INT16_MIN <= rv);
92   assert(rv <= INT16_MAX);
93 #endif
94   return (int16_t)rv;
95 }
96 
// One-dimensional transform: reads from the const int16_t buffer given as the
// first argument and writes to the int16_t buffer given as the second.
typedef void (*transform_1d)(const int16_t *, int16_t *);

// A pair of 1-D transforms making up a 2-D transform.
typedef struct {
  transform_1d cols;  // vertical
  transform_1d rows;  // horizontal
} transform_2d;
102 
// Inverse-transform entry points. Each takes a const 16-bit `input` buffer, a
// writable 8-bit `dest` buffer, an int `stride` and an int `eob`.
// NOTE(review): going by the names, `input` holds transform coefficients, the
// reconstructed residual is added into `dest` (rows `stride` apart) and `eob`
// is the end-of-block position -- confirm against the definitions, which are
// not part of this header.

// 4x4 inverse Walsh-Hadamard variant (per the name).
void vp9_iwht4x4_add(const int16_t *input, uint8_t *dest, int stride, int eob);

// Inverse DCT variants for 4x4, 8x8, 16x16 and 32x32 blocks (per the names).
void vp9_idct4x4_add(const int16_t *input, uint8_t *dest, int stride, int eob);
void vp9_idct8x8_add(const int16_t *input, uint8_t *dest, int stride, int eob);
void vp9_idct16x16_add(const int16_t *input, uint8_t *dest, int stride,
                       int eob);
void vp9_idct32x32_add(const int16_t *input, uint8_t *dest, int stride,
                       int eob);
111 
112 void vp9_iht4x4_add(TX_TYPE tx_type, const int16_t *input, uint8_t *dest,
113                     int stride, int eob);
114 void vp9_iht8x8_add(TX_TYPE tx_type, const int16_t *input, uint8_t *dest,
115                     int stride, int eob);
116 void vp9_iht16x16_add(TX_TYPE tx_type, const int16_t *input, uint8_t *dest,
117                       int stride, int eob);
118 
119 
120 #ifdef __cplusplus
121 }  // extern "C"
122 #endif
123 
124 #endif  // VP9_COMMON_VP9_IDCT_H_
125