1 /*
2  * Copyright © 2014-2018 Broadcom
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21  * IN THE SOFTWARE.
22  */
23 
24 #include "util/u_format.h"
25 
26 #include "vc5_context.h"
27 #include "broadcom/cle/v3dx_pack.h"
28 #include "broadcom/common/v3d_macros.h"
29 #include "vc5_format_table.h"
30 
31 #define SWIZ(x,y,z,w) {          \
32         PIPE_SWIZZLE_##x, \
33         PIPE_SWIZZLE_##y, \
34         PIPE_SWIZZLE_##z, \
35         PIPE_SWIZZLE_##w  \
36 }
37 
38 #define FORMAT(pipe, rt, tex, swiz, return_size, return_channels)       \
39         [PIPE_FORMAT_##pipe] = {                                        \
40                 true,                                                   \
41                 V3D_OUTPUT_IMAGE_FORMAT_##rt,                           \
42                 TEXTURE_DATA_FORMAT_##tex,                              \
43                 swiz,                                                   \
44                 return_size,                                            \
45                 return_channels,                                        \
46         }
47 
48 #define SWIZ_X001	SWIZ(X, 0, 0, 1)
49 #define SWIZ_XY01	SWIZ(X, Y, 0, 1)
50 #define SWIZ_XYZ1	SWIZ(X, Y, Z, 1)
51 #define SWIZ_XYZW	SWIZ(X, Y, Z, W)
52 #define SWIZ_YZWX	SWIZ(Y, Z, W, X)
53 #define SWIZ_YZW1	SWIZ(Y, Z, W, 1)
54 #define SWIZ_ZYXW	SWIZ(Z, Y, X, W)
55 #define SWIZ_ZYX1	SWIZ(Z, Y, X, 1)
56 #define SWIZ_XXXY	SWIZ(X, X, X, Y)
57 #define SWIZ_XXX1	SWIZ(X, X, X, 1)
58 #define SWIZ_XXXX	SWIZ(X, X, X, X)
59 #define SWIZ_000X	SWIZ(0, 0, 0, X)
60 
61 static const struct vc5_format format_table[] = {
62         FORMAT(B8G8R8A8_UNORM,    RGBA8,        RGBA8,       SWIZ_ZYXW, 16, 0),
63         FORMAT(B8G8R8X8_UNORM,    RGBA8,        RGBA8,       SWIZ_ZYX1, 16, 0),
64         FORMAT(B8G8R8A8_SRGB,     SRGB8_ALPHA8, RGBA8,       SWIZ_ZYXW, 16, 0),
65         FORMAT(B8G8R8X8_SRGB,     SRGB8_ALPHA8, RGBA8,       SWIZ_ZYX1, 16, 0),
66         FORMAT(R8G8B8A8_UNORM,    RGBA8,        RGBA8,       SWIZ_XYZW, 16, 0),
67         FORMAT(R8G8B8X8_UNORM,    RGBA8,        RGBA8,       SWIZ_XYZ1, 16, 0),
68         FORMAT(R8G8B8A8_SNORM,    NO,           RGBA8_SNORM, SWIZ_XYZW, 16, 0),
69         FORMAT(R8G8B8X8_SNORM,    NO,           RGBA8_SNORM, SWIZ_XYZ1, 16, 0),
70         FORMAT(R10G10B10A2_UNORM, RGB10_A2,     RGB10_A2,    SWIZ_XYZW, 16, 0),
71         FORMAT(B10G10R10A2_UINT,  RGB10_A2UI,   RGB10_A2UI,  SWIZ_ZYXW, 16, 0),
72 
73         FORMAT(B4G4R4A4_UNORM,    ABGR4444,     RGBA4,       SWIZ_YZWX, 16, 0),
74         FORMAT(B4G4R4X4_UNORM,    ABGR4444,     RGBA4,       SWIZ_YZW1, 16, 0),
75 
76         FORMAT(A1B5G5R5_UNORM,    ABGR1555,     RGB5_A1,     SWIZ_XYZW, 16, 0),
77         FORMAT(X1B5G5R5_UNORM,    ABGR1555,     RGB5_A1,     SWIZ_XYZ1, 16, 0),
78         FORMAT(B5G6R5_UNORM,      BGR565,       RGB565,      SWIZ_XYZ1, 16, 0),
79 
80         FORMAT(R8_UNORM,          R8,           R8,          SWIZ_X001, 16, 0),
81         FORMAT(R8_SNORM,          NO,           R8_SNORM,    SWIZ_X001, 16, 0),
82         FORMAT(R8G8_UNORM,        RG8,          RG8,         SWIZ_XY01, 16, 0),
83         FORMAT(R8G8_SNORM,        NO,           RG8_SNORM,   SWIZ_XY01, 16, 0),
84 
85         FORMAT(R16_UNORM,         NO,           R16,         SWIZ_X001, 32, 1),
86         FORMAT(R16_SNORM,         NO,           R16_SNORM,   SWIZ_X001, 32, 1),
87         FORMAT(R16_FLOAT,         R16F,         R16F,        SWIZ_X001, 16, 0),
88         FORMAT(R32_FLOAT,         R32F,         R32F,        SWIZ_X001, 32, 1),
89 
90         FORMAT(R16G16_UNORM,      NO,           RG16,        SWIZ_XY01, 32, 2),
91         FORMAT(R16G16_SNORM,      NO,           RG16_SNORM,  SWIZ_XY01, 32, 2),
92         FORMAT(R16G16_FLOAT,      RG16F,        RG16F,       SWIZ_XY01, 16, 0),
93         FORMAT(R32G32_FLOAT,      RG32F,        RG32F,       SWIZ_XY01, 32, 2),
94 
95         FORMAT(R16G16B16A16_UNORM, NO,          RGBA16,      SWIZ_XYZW, 32, 4),
96         FORMAT(R16G16B16A16_SNORM, NO,          RGBA16_SNORM, SWIZ_XYZW, 32, 4),
97         FORMAT(R16G16B16A16_FLOAT, RGBA16F,     RGBA16F,     SWIZ_XYZW, 16, 0),
98         FORMAT(R32G32B32A32_FLOAT, RGBA32F,     RGBA32F,     SWIZ_XYZW, 32, 4),
99 
100         /* If we don't have L/A/LA16, mesa/st will fall back to RGBA16. */
101         FORMAT(L16_UNORM,         NO,           R16,         SWIZ_XXX1, 32, 1),
102         FORMAT(L16_SNORM,         NO,           R16_SNORM,   SWIZ_XXX1, 32, 1),
103         FORMAT(I16_UNORM,         NO,           R16,         SWIZ_XXXX, 32, 1),
104         FORMAT(I16_SNORM,         NO,           R16_SNORM,   SWIZ_XXXX, 32, 1),
105         FORMAT(A16_UNORM,         NO,           R16,         SWIZ_000X, 32, 1),
106         FORMAT(A16_SNORM,         NO,           R16_SNORM,   SWIZ_000X, 32, 1),
107         FORMAT(L16A16_UNORM,      NO,           RG16,        SWIZ_XXXY, 32, 2),
108         FORMAT(L16A16_SNORM,      NO,           RG16_SNORM,  SWIZ_XXXY, 32, 2),
109 
110         FORMAT(A8_UNORM,          NO,           R8,          SWIZ_000X, 16, 0),
111         FORMAT(L8_UNORM,          NO,           R8,          SWIZ_XXX1, 16, 0),
112         FORMAT(I8_UNORM,          NO,           R8,          SWIZ_XXXX, 16, 0),
113         FORMAT(L8A8_UNORM,        NO,           RG8,         SWIZ_XXXY, 16, 0),
114 
115         FORMAT(R8_SINT,           R8I,          R8I,         SWIZ_X001, 16, 0),
116         FORMAT(R8_UINT,           R8UI,         R8UI,        SWIZ_X001, 16, 0),
117         FORMAT(R8G8_SINT,         RG8I,         RG8I,        SWIZ_XY01, 16, 0),
118         FORMAT(R8G8_UINT,         RG8UI,        RG8UI,       SWIZ_XY01, 16, 0),
119         FORMAT(R8G8B8A8_SINT,     RGBA8I,       RGBA8I,      SWIZ_XYZW, 16, 0),
120         FORMAT(R8G8B8A8_UINT,     RGBA8UI,      RGBA8UI,     SWIZ_XYZW, 16, 0),
121 
122         FORMAT(R16_SINT,          R16I,         R16I,        SWIZ_X001, 16, 0),
123         FORMAT(R16_UINT,          R16UI,        R16UI,       SWIZ_X001, 16, 0),
124         FORMAT(R16G16_SINT,       RG16I,        R16I,        SWIZ_XY01, 16, 0),
125         FORMAT(R16G16_UINT,       RG16UI,       R16UI,       SWIZ_XY01, 16, 0),
126         FORMAT(R16G16B16A16_SINT, RGBA16I,      RGBA16I,     SWIZ_XYZW, 16, 0),
127         FORMAT(R16G16B16A16_UINT, RGBA16UI,     RGBA16UI,    SWIZ_XYZW, 16, 0),
128 
129         FORMAT(R32_SINT,          R32I,         R32I,        SWIZ_X001, 32, 1),
130         FORMAT(R32_UINT,          R32UI,        R32UI,       SWIZ_X001, 32, 1),
131         FORMAT(R32G32_SINT,       RG32I,        RG32I,       SWIZ_XY01, 32, 2),
132         FORMAT(R32G32_UINT,       RG32UI,       RG32UI,      SWIZ_XY01, 32, 2),
133         FORMAT(R32G32B32A32_SINT, RGBA32I,      RGBA32I,     SWIZ_XYZW, 32, 4),
134         FORMAT(R32G32B32A32_UINT, RGBA32UI,     RGBA32UI,    SWIZ_XYZW, 32, 4),
135 
136         FORMAT(A8_SINT,           R8I,          R8I,         SWIZ_000X, 16, 0),
137         FORMAT(A8_UINT,           R8UI,         R8UI,        SWIZ_000X, 16, 0),
138         FORMAT(A16_SINT,          R16I,         R16I,        SWIZ_000X, 16, 0),
139         FORMAT(A16_UINT,          R16UI,        R16UI,       SWIZ_000X, 16, 0),
140         FORMAT(A32_SINT,          R32I,         R32I,        SWIZ_000X, 32, 1),
141         FORMAT(A32_UINT,          R32UI,        R32UI,       SWIZ_000X, 32, 1),
142 
143         FORMAT(R11G11B10_FLOAT,   R11F_G11F_B10F, R11F_G11F_B10F, SWIZ_XYZW, 16, 0),
144         FORMAT(R9G9B9E5_FLOAT,    NO,           RGB9_E5,     SWIZ_XYZW, 16, 0),
145 
146 #if V3D_VERSION >= 40
147         FORMAT(S8_UINT_Z24_UNORM, D24S8,        DEPTH24_X8,  SWIZ_XXXX, 32, 1),
148         FORMAT(X8Z24_UNORM,       D24S8,        DEPTH24_X8,  SWIZ_XXXX, 32, 1),
149         FORMAT(S8X24_UINT,        S8,           R32F,        SWIZ_XXXX, 32, 1),
150         FORMAT(Z32_FLOAT,         D32F,         R32F,        SWIZ_XXXX, 32, 1),
151         FORMAT(Z16_UNORM,         D16,          DEPTH_COMP16,SWIZ_XXXX, 32, 1),
152 
153         /* Pretend we support this, but it'll be separate Z32F depth and S8. */
154         FORMAT(Z32_FLOAT_S8X24_UINT, D32F,      R32F,        SWIZ_XXXX, 32, 1),
155 #else
156         FORMAT(S8_UINT_Z24_UNORM, ZS_DEPTH24_STENCIL8, DEPTH24_X8, SWIZ_XXXX, 32, 1),
157         FORMAT(X8Z24_UNORM,       ZS_DEPTH24_STENCIL8, DEPTH24_X8, SWIZ_XXXX, 32, 1),
158         FORMAT(S8X24_UINT,        NO,           R32F,        SWIZ_XXXX, 32, 1),
159         FORMAT(Z32_FLOAT,         ZS_DEPTH_COMPONENT32F, R32F, SWIZ_XXXX, 32, 1),
160         FORMAT(Z16_UNORM,         ZS_DEPTH_COMPONENT16,  DEPTH_COMP16, SWIZ_XXXX, 32, 1),
161 
162         /* Pretend we support this, but it'll be separate Z32F depth and S8. */
163         FORMAT(Z32_FLOAT_S8X24_UINT, ZS_DEPTH_COMPONENT32F, R32F, SWIZ_XXXX, 32, 1),
164 #endif
165 
166         FORMAT(ETC2_RGB8,         NO,           RGB8_ETC2,   SWIZ_XYZ1, 16, 0),
167         FORMAT(ETC2_SRGB8,        NO,           RGB8_ETC2,   SWIZ_XYZ1, 16, 0),
168         FORMAT(ETC2_RGB8A1,       NO,           RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, 0),
169         FORMAT(ETC2_SRGB8A1,      NO,           RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, 0),
170         FORMAT(ETC2_RGBA8,        NO,           RGBA8_ETC2_EAC, SWIZ_XYZW, 16, 0),
171         FORMAT(ETC2_SRGBA8,       NO,           RGBA8_ETC2_EAC, SWIZ_XYZW, 16, 0),
172         FORMAT(ETC2_R11_UNORM,    NO,           R11_EAC,     SWIZ_X001, 16, 0),
173         FORMAT(ETC2_R11_SNORM,    NO,           SIGNED_R11_EAC, SWIZ_X001, 16, 0),
174         FORMAT(ETC2_RG11_UNORM,   NO,           RG11_EAC,    SWIZ_XY01, 16, 0),
175         FORMAT(ETC2_RG11_SNORM,   NO,           SIGNED_RG11_EAC, SWIZ_XY01, 16, 0),
176 
177         FORMAT(DXT1_RGB,          NO,           BC1,         SWIZ_XYZ1, 16, 0),
178         FORMAT(DXT3_RGBA,         NO,           BC2,         SWIZ_XYZ1, 16, 0),
179         FORMAT(DXT5_RGBA,         NO,           BC3,         SWIZ_XYZ1, 16, 0),
180 };
181 
182 const struct vc5_format *
v3dX(get_format_desc)183 v3dX(get_format_desc)(enum pipe_format f)
184 {
185         if (f < ARRAY_SIZE(format_table) && format_table[f].present)
186                 return &format_table[f];
187         else
188                 return NULL;
189 }
190 
191 void
v3dX(get_internal_type_bpp_for_output_format)192 v3dX(get_internal_type_bpp_for_output_format)(uint32_t format,
193                                               uint32_t *type,
194                                               uint32_t *bpp)
195 {
196         switch (format) {
197         case V3D_OUTPUT_IMAGE_FORMAT_RGBA8:
198 #if V3D_VERSION < 41
199         case V3D_OUTPUT_IMAGE_FORMAT_RGBX8:
200 #endif
201         case V3D_OUTPUT_IMAGE_FORMAT_RGB8:
202         case V3D_OUTPUT_IMAGE_FORMAT_RG8:
203         case V3D_OUTPUT_IMAGE_FORMAT_R8:
204         case V3D_OUTPUT_IMAGE_FORMAT_ABGR4444:
205         case V3D_OUTPUT_IMAGE_FORMAT_BGR565:
206         case V3D_OUTPUT_IMAGE_FORMAT_ABGR1555:
207                 *type = V3D_INTERNAL_TYPE_8;
208                 *bpp = V3D_INTERNAL_BPP_32;
209                 break;
210 
211         case V3D_OUTPUT_IMAGE_FORMAT_RGBA8I:
212         case V3D_OUTPUT_IMAGE_FORMAT_RG8I:
213         case V3D_OUTPUT_IMAGE_FORMAT_R8I:
214                 *type = V3D_INTERNAL_TYPE_8I;
215                 *bpp = V3D_INTERNAL_BPP_32;
216                 break;
217 
218         case V3D_OUTPUT_IMAGE_FORMAT_RGBA8UI:
219         case V3D_OUTPUT_IMAGE_FORMAT_RG8UI:
220         case V3D_OUTPUT_IMAGE_FORMAT_R8UI:
221                 *type = V3D_INTERNAL_TYPE_8UI;
222                 *bpp = V3D_INTERNAL_BPP_32;
223                 break;
224 
225         case V3D_OUTPUT_IMAGE_FORMAT_SRGB8_ALPHA8:
226         case V3D_OUTPUT_IMAGE_FORMAT_SRGB:
227         case V3D_OUTPUT_IMAGE_FORMAT_RGB10_A2:
228         case V3D_OUTPUT_IMAGE_FORMAT_R11F_G11F_B10F:
229 #if V3D_VERSION < 41
230         case V3D_OUTPUT_IMAGE_FORMAT_SRGBX8:
231 #endif
232         case V3D_OUTPUT_IMAGE_FORMAT_RGBA16F:
233                 /* Note that sRGB RTs are stored in the tile buffer at 16F,
234                  * and the conversion to sRGB happens at tilebuffer
235                  * load/store.
236                  */
237                 *type = V3D_INTERNAL_TYPE_16F;
238                 *bpp = V3D_INTERNAL_BPP_64;
239                 break;
240 
241         case V3D_OUTPUT_IMAGE_FORMAT_RG16F:
242         case V3D_OUTPUT_IMAGE_FORMAT_R16F:
243                 *type = V3D_INTERNAL_TYPE_16F;
244                 /* Use 64bpp to make sure the TLB doesn't throw away the alpha
245                  * channel before alpha test happens.
246                  */
247                 *bpp = V3D_INTERNAL_BPP_64;
248                 break;
249 
250         case V3D_OUTPUT_IMAGE_FORMAT_RGBA16I:
251                 *type = V3D_INTERNAL_TYPE_16I;
252                 *bpp = V3D_INTERNAL_BPP_64;
253                 break;
254         case V3D_OUTPUT_IMAGE_FORMAT_RG16I:
255         case V3D_OUTPUT_IMAGE_FORMAT_R16I:
256                 *type = V3D_INTERNAL_TYPE_16I;
257                 *bpp = V3D_INTERNAL_BPP_32;
258                 break;
259 
260         case V3D_OUTPUT_IMAGE_FORMAT_RGB10_A2UI:
261         case V3D_OUTPUT_IMAGE_FORMAT_RGBA16UI:
262                 *type = V3D_INTERNAL_TYPE_16UI;
263                 *bpp = V3D_INTERNAL_BPP_64;
264                 break;
265         case V3D_OUTPUT_IMAGE_FORMAT_RG16UI:
266         case V3D_OUTPUT_IMAGE_FORMAT_R16UI:
267                 *type = V3D_INTERNAL_TYPE_16UI;
268                 *bpp = V3D_INTERNAL_BPP_32;
269                 break;
270 
271         case V3D_OUTPUT_IMAGE_FORMAT_RGBA32I:
272                 *type = V3D_INTERNAL_TYPE_32I;
273                 *bpp = V3D_INTERNAL_BPP_128;
274                 break;
275         case V3D_OUTPUT_IMAGE_FORMAT_RG32I:
276                 *type = V3D_INTERNAL_TYPE_32I;
277                 *bpp = V3D_INTERNAL_BPP_64;
278                 break;
279         case V3D_OUTPUT_IMAGE_FORMAT_R32I:
280                 *type = V3D_INTERNAL_TYPE_32I;
281                 *bpp = V3D_INTERNAL_BPP_32;
282                 break;
283 
284         case V3D_OUTPUT_IMAGE_FORMAT_RGBA32UI:
285                 *type = V3D_INTERNAL_TYPE_32UI;
286                 *bpp = V3D_INTERNAL_BPP_128;
287                 break;
288         case V3D_OUTPUT_IMAGE_FORMAT_RG32UI:
289                 *type = V3D_INTERNAL_TYPE_32UI;
290                 *bpp = V3D_INTERNAL_BPP_64;
291                 break;
292         case V3D_OUTPUT_IMAGE_FORMAT_R32UI:
293                 *type = V3D_INTERNAL_TYPE_32UI;
294                 *bpp = V3D_INTERNAL_BPP_32;
295                 break;
296 
297         case V3D_OUTPUT_IMAGE_FORMAT_RGBA32F:
298                 *type = V3D_INTERNAL_TYPE_32F;
299                 *bpp = V3D_INTERNAL_BPP_128;
300                 break;
301         case V3D_OUTPUT_IMAGE_FORMAT_RG32F:
302                 *type = V3D_INTERNAL_TYPE_32F;
303                 *bpp = V3D_INTERNAL_BPP_64;
304                 break;
305         case V3D_OUTPUT_IMAGE_FORMAT_R32F:
306                 *type = V3D_INTERNAL_TYPE_32F;
307                 *bpp = V3D_INTERNAL_BPP_32;
308                 break;
309 
310         default:
311                 /* Provide some default values, as we'll be called at RB
312                  * creation time, even if an RB with this format isn't
313                  * supported.
314                  */
315                 *type = V3D_INTERNAL_TYPE_8;
316                 *bpp = V3D_INTERNAL_BPP_32;
317                 break;
318         }
319 }
320