1 /*
2 * Copyright (c) 2013 The WebM project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
11 #ifndef VP9_COMMON_MIPS_DSPR2_VP9_COMMON_DSPR2_H_
12 #define VP9_COMMON_MIPS_DSPR2_VP9_COMMON_DSPR2_H_
13
14 #include <assert.h>
15
16 #include "./vpx_config.h"
17 #include "vpx/vpx_integer.h"
18 #include "vp9/common/vp9_common.h"
19
20 #ifdef __cplusplus
21 extern "C" {
22 #endif
23
24 #if HAVE_DSPR2
25 #define CROP_WIDTH 512
26 extern uint8_t *vp9_ff_cropTbl;
27
28 #define DCT_CONST_ROUND_SHIFT_TWICE_COSPI_16_64(input) ({ \
29 \
30 int32_t tmp, out; \
31 int dct_cost_rounding = DCT_CONST_ROUNDING; \
32 int in = input; \
33 \
34 __asm__ __volatile__ ( \
35 /* out = dct_const_round_shift(input_dc * cospi_16_64); */ \
36 "mtlo %[dct_cost_rounding], $ac1 \n\t"\
37 "mthi $zero, $ac1 \n\t"\
38 "madd $ac1, %[in], %[cospi_16_64] \n\t"\
39 "extp %[tmp], $ac1, 31 \n\t"\
40 \
41 /* out = dct_const_round_shift(out * cospi_16_64); */ \
42 "mtlo %[dct_cost_rounding], $ac2 \n\t"\
43 "mthi $zero, $ac2 \n\t"\
44 "madd $ac2, %[tmp], %[cospi_16_64] \n\t"\
45 "extp %[out], $ac2, 31 \n\t"\
46 \
47 : [tmp] "=&r" (tmp), [out] "=r" (out) \
48 : [in] "r" (in), \
49 [dct_cost_rounding] "r" (dct_cost_rounding), \
50 [cospi_16_64] "r" (cospi_16_64) \
51 ); \
52 out; })
53
vp9_prefetch_load(const unsigned char * src)54 static INLINE void vp9_prefetch_load(const unsigned char *src) {
55 __asm__ __volatile__ (
56 "pref 0, 0(%[src]) \n\t"
57 :
58 : [src] "r" (src)
59 );
60 }
61
62 /* prefetch data for store */
vp9_prefetch_store(unsigned char * dst)63 static INLINE void vp9_prefetch_store(unsigned char *dst) {
64 __asm__ __volatile__ (
65 "pref 1, 0(%[dst]) \n\t"
66 :
67 : [dst] "r" (dst)
68 );
69 }
70
vp9_prefetch_load_streamed(const unsigned char * src)71 static INLINE void vp9_prefetch_load_streamed(const unsigned char *src) {
72 __asm__ __volatile__ (
73 "pref 4, 0(%[src]) \n\t"
74 :
75 : [src] "r" (src)
76 );
77 }
78
79 /* prefetch data for store */
vp9_prefetch_store_streamed(unsigned char * dst)80 static INLINE void vp9_prefetch_store_streamed(unsigned char *dst) {
81 __asm__ __volatile__ (
82 "pref 5, 0(%[dst]) \n\t"
83 :
84 : [dst] "r" (dst)
85 );
86 }
87
88 void vp9_idct32_cols_add_blk_dspr2(int16_t *input, uint8_t *dest,
89 int dest_stride);
90
91 void vp9_convolve2_horiz_dspr2(const uint8_t *src, ptrdiff_t src_stride,
92 uint8_t *dst, ptrdiff_t dst_stride,
93 const int16_t *filter_x, int x_step_q4,
94 const int16_t *filter_y, int y_step_q4,
95 int w, int h);
96
97 void vp9_convolve2_avg_horiz_dspr2(const uint8_t *src, ptrdiff_t src_stride,
98 uint8_t *dst, ptrdiff_t dst_stride,
99 const int16_t *filter_x, int x_step_q4,
100 const int16_t *filter_y, int y_step_q4,
101 int w, int h);
102
103 void vp9_convolve2_avg_vert_dspr2(const uint8_t *src, ptrdiff_t src_stride,
104 uint8_t *dst, ptrdiff_t dst_stride,
105 const int16_t *filter_x, int x_step_q4,
106 const int16_t *filter_y, int y_step_q4,
107 int w, int h);
108
109 void vp9_convolve2_dspr2(const uint8_t *src, ptrdiff_t src_stride,
110 uint8_t *dst, ptrdiff_t dst_stride,
111 const int16_t *filter,
112 int w, int h);
113
114 void vp9_convolve2_vert_dspr2(const uint8_t *src, ptrdiff_t src_stride,
115 uint8_t *dst, ptrdiff_t dst_stride,
116 const int16_t *filter_x, int x_step_q4,
117 const int16_t *filter_y, int y_step_q4,
118 int w, int h);
119
120 #endif // #if HAVE_DSPR2
121 #ifdef __cplusplus
122 } // extern "C"
123 #endif
124
125 #endif // VP9_COMMON_MIPS_DSPR2_VP9_COMMON_DSPR2_H_
126