1 /*
2  * Copyright © 2015 Intel Corporation
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21  * DEALINGS IN THE SOFTWARE.
22  */
23 
24 #include "tu_private.h"
25 
26 #include <assert.h>
27 #include <errno.h>
28 #include <stdarg.h>
29 #include <stdio.h>
30 #include <stdlib.h>
31 #include <string.h>
32 
33 #include "util/u_math.h"
34 #include "vk_enum_to_str.h"
35 
36 void PRINTFLIKE(3, 4)
__tu_finishme(const char * file,int line,const char * format,...)37    __tu_finishme(const char *file, int line, const char *format, ...)
38 {
39    va_list ap;
40    char buffer[256];
41 
42    va_start(ap, format);
43    vsnprintf(buffer, sizeof(buffer), format, ap);
44    va_end(ap);
45 
46    mesa_loge("%s:%d: FINISHME: %s\n", file, line, buffer);
47 }
48 
49 VkResult
__vk_errorf(struct tu_instance * instance,VkResult error,bool always_print,const char * file,int line,const char * format,...)50 __vk_errorf(struct tu_instance *instance,
51             VkResult error,
52             bool always_print,
53             const char *file,
54             int line,
55             const char *format,
56             ...)
57 {
58    va_list ap;
59    char buffer[256];
60 
61    const char *error_str = vk_Result_to_str(error);
62 
63 #ifndef DEBUG
64    if (!always_print)
65       return error;
66 #endif
67 
68    if (format) {
69       va_start(ap, format);
70       vsnprintf(buffer, sizeof(buffer), format, ap);
71       va_end(ap);
72 
73       mesa_loge("%s:%d: %s (%s)\n", file, line, buffer, error_str);
74    } else {
75       mesa_loge("%s:%d: %s\n", file, line, error_str);
76    }
77 
78    return error;
79 }
80 
81 static void
tu_tiling_config_update_tile_layout(struct tu_framebuffer * fb,const struct tu_device * dev,const struct tu_render_pass * pass)82 tu_tiling_config_update_tile_layout(struct tu_framebuffer *fb,
83                                     const struct tu_device *dev,
84                                     const struct tu_render_pass *pass)
85 {
86    const uint32_t tile_align_w = pass->tile_align_w;
87    const uint32_t tile_align_h = dev->physical_device->info.tile_align_h;
88    const uint32_t max_tile_width = 1024;
89 
90    /* start from 1 tile */
91    fb->tile_count = (VkExtent2D) {
92       .width = 1,
93       .height = 1,
94    };
95    fb->tile0 = (VkExtent2D) {
96       .width = util_align_npot(fb->width, tile_align_w),
97       .height = align(fb->height, tile_align_h),
98    };
99 
100    if (unlikely(dev->physical_device->instance->debug_flags & TU_DEBUG_FORCEBIN)) {
101       /* start with 2x2 tiles */
102       fb->tile_count.width = 2;
103       fb->tile_count.height = 2;
104       fb->tile0.width = util_align_npot(DIV_ROUND_UP(fb->width, 2), tile_align_w);
105       fb->tile0.height = align(DIV_ROUND_UP(fb->height, 2), tile_align_h);
106    }
107 
108    /* do not exceed max tile width */
109    while (fb->tile0.width > max_tile_width) {
110       fb->tile_count.width++;
111       fb->tile0.width =
112          util_align_npot(DIV_ROUND_UP(fb->width, fb->tile_count.width), tile_align_w);
113    }
114 
115    /* will force to sysmem, don't bother trying to have a valid tile config
116     * TODO: just skip all GMEM stuff when sysmem is forced?
117     */
118    if (!pass->gmem_pixels)
119       return;
120 
121    /* do not exceed gmem size */
122    while (fb->tile0.width * fb->tile0.height > pass->gmem_pixels) {
123       if (fb->tile0.width > MAX2(tile_align_w, fb->tile0.height)) {
124          fb->tile_count.width++;
125          fb->tile0.width =
126             util_align_npot(DIV_ROUND_UP(fb->width, fb->tile_count.width), tile_align_w);
127       } else {
128          /* if this assert fails then layout is impossible.. */
129          assert(fb->tile0.height > tile_align_h);
130          fb->tile_count.height++;
131          fb->tile0.height =
132             align(DIV_ROUND_UP(fb->height, fb->tile_count.height), tile_align_h);
133       }
134    }
135 }
136 
137 static void
tu_tiling_config_update_pipe_layout(struct tu_framebuffer * fb,const struct tu_device * dev)138 tu_tiling_config_update_pipe_layout(struct tu_framebuffer *fb,
139                                     const struct tu_device *dev)
140 {
141    const uint32_t max_pipe_count = 32; /* A6xx */
142 
143    /* start from 1 tile per pipe */
144    fb->pipe0 = (VkExtent2D) {
145       .width = 1,
146       .height = 1,
147    };
148    fb->pipe_count = fb->tile_count;
149 
150    while (fb->pipe_count.width * fb->pipe_count.height > max_pipe_count) {
151       if (fb->pipe0.width < fb->pipe0.height) {
152          fb->pipe0.width += 1;
153          fb->pipe_count.width =
154             DIV_ROUND_UP(fb->tile_count.width, fb->pipe0.width);
155       } else {
156          fb->pipe0.height += 1;
157          fb->pipe_count.height =
158             DIV_ROUND_UP(fb->tile_count.height, fb->pipe0.height);
159       }
160    }
161 }
162 
163 static void
tu_tiling_config_update_pipes(struct tu_framebuffer * fb,const struct tu_device * dev)164 tu_tiling_config_update_pipes(struct tu_framebuffer *fb,
165                               const struct tu_device *dev)
166 {
167    const uint32_t max_pipe_count = 32; /* A6xx */
168    const uint32_t used_pipe_count =
169       fb->pipe_count.width * fb->pipe_count.height;
170    const VkExtent2D last_pipe = {
171       .width = (fb->tile_count.width - 1) % fb->pipe0.width + 1,
172       .height = (fb->tile_count.height - 1) % fb->pipe0.height + 1,
173    };
174 
175    assert(used_pipe_count <= max_pipe_count);
176    assert(max_pipe_count <= ARRAY_SIZE(fb->pipe_config));
177 
178    for (uint32_t y = 0; y < fb->pipe_count.height; y++) {
179       for (uint32_t x = 0; x < fb->pipe_count.width; x++) {
180          const uint32_t pipe_x = fb->pipe0.width * x;
181          const uint32_t pipe_y = fb->pipe0.height * y;
182          const uint32_t pipe_w = (x == fb->pipe_count.width - 1)
183                                     ? last_pipe.width
184                                     : fb->pipe0.width;
185          const uint32_t pipe_h = (y == fb->pipe_count.height - 1)
186                                     ? last_pipe.height
187                                     : fb->pipe0.height;
188          const uint32_t n = fb->pipe_count.width * y + x;
189 
190          fb->pipe_config[n] = A6XX_VSC_PIPE_CONFIG_REG_X(pipe_x) |
191                                   A6XX_VSC_PIPE_CONFIG_REG_Y(pipe_y) |
192                                   A6XX_VSC_PIPE_CONFIG_REG_W(pipe_w) |
193                                   A6XX_VSC_PIPE_CONFIG_REG_H(pipe_h);
194          fb->pipe_sizes[n] = CP_SET_BIN_DATA5_0_VSC_SIZE(pipe_w * pipe_h);
195       }
196    }
197 
198    memset(fb->pipe_config + used_pipe_count, 0,
199           sizeof(uint32_t) * (max_pipe_count - used_pipe_count));
200 }
201 
/*
 * Compute the complete tiling configuration of a framebuffer for the given
 * render pass.
 *
 * The three steps run in a fixed order because each one reads fields of
 * `fb` written by the previous one: the tile layout first, then the
 * grouping of tiles into pipes, and finally the per-pipe configuration
 * words.
 */
void
tu_framebuffer_tiling_config(struct tu_framebuffer *fb,
                             const struct tu_device *device,
                             const struct tu_render_pass *pass)
{
   /* writes fb->tile_count and fb->tile0 */
   tu_tiling_config_update_tile_layout(fb, device, pass);

   /* writes fb->pipe0 and fb->pipe_count from fb->tile_count */
   tu_tiling_config_update_pipe_layout(fb, device);

   /* writes fb->pipe_config[] and fb->pipe_sizes[] */
   tu_tiling_config_update_pipes(fb, device);
}
211