1 /*
2  * Copyright © 2014 Broadcom
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21  * IN THE SOFTWARE.
22  */
23 
24 #ifndef VC4_TILING_H
25 #define VC4_TILING_H
26 
27 #include <stdbool.h>
28 #include <stdint.h>
29 #include "util/macros.h"
30 #include "util/u_cpu_detect.h"
31 
/**
 * Width, in pixels, of a single 64-byte microtile.
 *
 * \param cpp  bytes per pixel; only 1, 2, 4 and 8 are handled.
 *
 * Together with vc4_utile_height(), width * height * cpp is 64 for every
 * supported cpp.  Any other cpp value hits unreachable().
 */
static inline uint32_t
vc4_utile_width(int cpp)
{
        /* 8-bit and 16-bit pixels share the widest microtile. */
        if (cpp == 1 || cpp == 2)
                return 8;

        if (cpp == 4)
                return 4;

        if (cpp == 8)
                return 2;

        unreachable("unknown cpp");
}
48 
/**
 * Height, in pixels, of a single 64-byte microtile.
 *
 * \param cpp  bytes per pixel; only 1, 2, 4 and 8 are handled.
 *
 * Only the 1-byte-per-pixel layout is 8 rows tall; every other supported
 * cpp uses 4 rows.  Any other cpp value hits unreachable().
 */
static inline uint32_t
vc4_utile_height(int cpp)
{
        if (cpp == 1)
                return 8;

        if (cpp == 2 || cpp == 4 || cpp == 8)
                return 4;

        unreachable("unknown cpp");
}
64 
65 bool vc4_size_is_lt(uint32_t width, uint32_t height, int cpp) ATTRIBUTE_CONST;
66 void vc4_load_lt_image_base(void *dst, uint32_t dst_stride,
67                             void *src, uint32_t src_stride,
68                             int cpp, const struct pipe_box *box);
69 void vc4_store_lt_image_base(void *dst, uint32_t dst_stride,
70                              void *src, uint32_t src_stride,
71                              int cpp, const struct pipe_box *box);
72 void vc4_load_lt_image_neon(void *dst, uint32_t dst_stride,
73                             void *src, uint32_t src_stride,
74                             int cpp, const struct pipe_box *box);
75 void vc4_store_lt_image_neon(void *dst, uint32_t dst_stride,
76                              void *src, uint32_t src_stride,
77                              int cpp, const struct pipe_box *box);
78 void vc4_load_tiled_image(void *dst, uint32_t dst_stride,
79                           void *src, uint32_t src_stride,
80                           uint8_t tiling_format, int cpp,
81                           const struct pipe_box *box);
82 void vc4_store_tiled_image(void *dst, uint32_t dst_stride,
83                            void *src, uint32_t src_stride,
84                            uint8_t tiling_format, int cpp,
85                            const struct pipe_box *box);
86 
/**
 * Dispatch an LT image load to the best available implementation.
 *
 * When built with USE_ARM_ASM and the CPU reports NEON support
 * (util_cpu_caps.has_neon), the call goes to vc4_load_lt_image_neon();
 * in every other case it goes to vc4_load_lt_image_base().  All arguments
 * are forwarded unchanged.
 */
static inline void
vc4_load_lt_image(void *dst, uint32_t dst_stride,
                  void *src, uint32_t src_stride,
                  int cpp, const struct pipe_box *box)
{
#ifdef USE_ARM_ASM
        if (util_cpu_caps.has_neon) {
                vc4_load_lt_image_neon(dst, dst_stride, src, src_stride,
                                       cpp, box);
        } else {
                vc4_load_lt_image_base(dst, dst_stride, src, src_stride,
                                       cpp, box);
        }
#else
        /* No ARM assembly in this build: only the generic path exists. */
        vc4_load_lt_image_base(dst, dst_stride, src, src_stride,
                               cpp, box);
#endif
}
102 
/**
 * Dispatch an LT image store to the best available implementation.
 *
 * When built with USE_ARM_ASM and the CPU reports NEON support
 * (util_cpu_caps.has_neon), the call goes to vc4_store_lt_image_neon();
 * in every other case it goes to vc4_store_lt_image_base().  All arguments
 * are forwarded unchanged.
 */
static inline void
vc4_store_lt_image(void *dst, uint32_t dst_stride,
                   void *src, uint32_t src_stride,
                   int cpp, const struct pipe_box *box)
{
#ifdef USE_ARM_ASM
        if (util_cpu_caps.has_neon) {
                vc4_store_lt_image_neon(dst, dst_stride, src, src_stride,
                                        cpp, box);
        } else {
                vc4_store_lt_image_base(dst, dst_stride, src, src_stride,
                                        cpp, box);
        }
#else
        /* No ARM assembly in this build: only the generic path exists. */
        vc4_store_lt_image_base(dst, dst_stride, src, src_stride,
                                cpp, box);
#endif
}
119 
120 #endif /* VC4_TILING_H */
121