1 /*
2  * Copyright © 2012 Intel Corporation
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21  * IN THE SOFTWARE.
22  */
23 
24 #ifndef BLORP_PRIV_H
25 #define BLORP_PRIV_H
26 
27 #include <stdint.h>
28 
29 #include "compiler/nir/nir.h"
30 #include "compiler/brw_compiler.h"
31 
32 #include "blorp.h"
33 
34 #ifdef __cplusplus
35 extern "C" {
36 #endif
37 
/**
 * Binding table indices used by BLORP.
 *
 * The enumerators are consecutive and start at zero, so the final
 * enumerator doubles as the number of binding table entries.
 */
enum {
   BLORP_RENDERBUFFER_BT_INDEX = 0,
   BLORP_TEXTURE_BT_INDEX,

   /* Count of the indices above; not an index itself. */
   BLORP_NUM_BT_ENTRIES
};
46 
47 struct brw_blorp_surface_info
48 {
49    bool enabled;
50 
51    struct isl_surf surf;
52    struct blorp_address addr;
53 
54    struct isl_surf aux_surf;
55    struct blorp_address aux_addr;
56    enum isl_aux_usage aux_usage;
57 
58    union isl_color_value clear_color;
59    struct blorp_address clear_color_addr;
60 
61    struct isl_view view;
62 
63    /* Z offset into a 3-D texture or slice of a 2-D array texture. */
64    uint32_t z_offset;
65 
66    uint32_t tile_x_sa, tile_y_sa;
67 };
68 
/*
 * Helpers operating on struct brw_blorp_surface_info.  Only the prototypes
 * are visible in this header; the notes below are inferred from names and
 * parameter lists and should be confirmed against the definitions.
 */

/* NOTE(review): presumably fills in *info from surf for the given miplevel,
 * layer and format - confirm.
 */
void
brw_blorp_surface_info_init(struct blorp_context *blorp,
                            struct brw_blorp_surface_info *info,
                            const struct blorp_surf *surf,
                            unsigned int level,
                            unsigned int layer,
                            enum isl_format format,
                            bool is_render_target);

/* NOTE(review): presumably rewrites *info in place so that it describes a
 * single slice of the surface - confirm.
 */
void
blorp_surf_convert_to_single_slice(const struct isl_device *isl_dev,
                                   struct brw_blorp_surface_info *info);

/* NOTE(review): presumably rewrites *info in place as an uncompressed
 * surface and adjusts the rectangle passed through x/y/width/height to
 * match - confirm, including whether the pointers may be NULL.
 */
void
blorp_surf_convert_to_uncompressed(const struct isl_device *isl_dev,
                                   struct brw_blorp_surface_info *info,
                                   uint32_t *x,
                                   uint32_t *y,
                                   uint32_t *width,
                                   uint32_t *height);
83 
84 
/**
 * A multiplier/offset pair; struct brw_blorp_wm_inputs carries two of them.
 *
 * NOTE(review): presumably applied per axis as
 * coord * multiplier + offset - confirm against the blit shader.
 */
struct brw_blorp_coord_transform
{
   float multiplier;
   float offset;
};
90 
/**
 * Bounding rectangle that tells the pixel-discard code which pixels must not
 * be touched.  This is needed when a surface is configured as something other
 * than what it really is:
 *
 *    - writing W-tiled stencil as Y-tiled
 *    - writing interleaved multisampled as single sampled.
 *
 * See blorp_nir_discard_if_outside_rect().
 *
 * Note the member order: both x bounds come first, then both y bounds.
 */
struct brw_blorp_discard_rect
{
   uint32_t x0;
   uint32_t x1;
   uint32_t y0;
   uint32_t y1;
};
108 
/**
 * Grid needed for blended and scaled blits of integer formats, see
 * blorp_nir_manual_blend_bilinear().
 *
 * Two floats of payload followed by two floats of padding, i.e. four floats
 * in total.
 */
struct brw_blorp_rect_grid
{
   float x1;
   float y1;

   /* Unused filler that rounds the struct up to four floats. */
   float pad[2];
};
119 
/**
 * An unsigned (x, y) offset pair.  struct brw_blorp_wm_inputs uses it for
 * its src_offset and dst_offset members.
 */
struct blorp_surf_offset {
   uint32_t x;
   uint32_t y;
};
124 
125 struct brw_blorp_wm_inputs
126 {
127    uint32_t clear_color[4];
128 
129    struct brw_blorp_discard_rect discard_rect;
130    struct brw_blorp_rect_grid rect_grid;
131    struct brw_blorp_coord_transform coord_transform[2];
132 
133    struct blorp_surf_offset src_offset;
134    struct blorp_surf_offset dst_offset;
135 
136    /* (1/width, 1/height) for the source surface */
137    float src_inv_size[2];
138 
139    /* Minimum layer setting works for all the textures types but texture_3d
140     * for which the setting has no effect. Use the z-coordinate instead.
141     */
142    uint32_t src_z;
143 
144    /* Pad out to an integral number of registers */
145    uint32_t pad[1];
146 };
147 
/**
 * Create a shader-input NIR variable backed by member \p name of
 * struct brw_blorp_wm_inputs and evaluate to the new nir_variable pointer.
 *
 * \param shader  Shader the variable is created in.  Evaluated exactly once.
 * \param name    Member of struct brw_blorp_wm_inputs.  Its spelling is also
 *                used as the variable's name string.
 * \param type    Type argument forwarded to nir_variable_create().
 *
 * The member's offset, counted in floats, selects where the input lives:
 * each group of four floats advances data.location by one starting at
 * VARYING_SLOT_VAR0, and the index within the group becomes
 * data.location_frac.  When the shader stage is MESA_SHADER_FRAGMENT the
 * input is marked INTERP_MODE_FLAT.
 *
 * This relies on the GNU statement-expression extension.  The locals carry a
 * trailing underscore to make accidental capture of caller names unlikely.
 */
#define BLORP_CREATE_NIR_INPUT(shader, name, type) ({ \
   struct nir_shader *blorp_shader_ = (shader); \
   const size_t blorp_dword_ = \
      offsetof(struct brw_blorp_wm_inputs, name) / sizeof(float); \
   nir_variable *blorp_input_ = \
      nir_variable_create(blorp_shader_, nir_var_shader_in, (type), #name); \
   if (blorp_shader_->info.stage == MESA_SHADER_FRAGMENT) \
      blorp_input_->data.interpolation = INTERP_MODE_FLAT; \
   blorp_input_->data.location = VARYING_SLOT_VAR0 + blorp_dword_ / 4; \
   blorp_input_->data.location_frac = blorp_dword_ % 4; \
   blorp_input_; \
})
159 
/**
 * Inputs for the BLORP vertex shader: two dwords of payload followed by two
 * dwords of padding, four dwords in total.
 */
struct blorp_vs_inputs {
   uint32_t base_layer;

   /* Set in hardware by SGVS */
   uint32_t _instance_id;

   /* Filler rounding the struct up to four dwords. */
   uint32_t pad[2];
};
165 
166 static inline unsigned
brw_blorp_get_urb_length(const struct brw_wm_prog_data * prog_data)167 brw_blorp_get_urb_length(const struct brw_wm_prog_data *prog_data)
168 {
169    if (prog_data == NULL)
170       return 1;
171 
172    /* From the BSpec: 3D Pipeline - Strips and Fans - 3DSTATE_SBE
173     *
174     * read_length = ceiling((max_source_attr+1)/2)
175     */
176    return MAX2((prog_data->num_varying_inputs + 1) / 2, 1);
177 }
178 
179 struct blorp_params
180 {
181    uint32_t x0;
182    uint32_t y0;
183    uint32_t x1;
184    uint32_t y1;
185    float z;
186    uint8_t stencil_mask;
187    uint8_t stencil_ref;
188    struct brw_blorp_surface_info depth;
189    struct brw_blorp_surface_info stencil;
190    uint32_t depth_format;
191    struct brw_blorp_surface_info src;
192    struct brw_blorp_surface_info dst;
193    enum blorp_hiz_op hiz_op;
194    bool full_surface_hiz_op;
195    enum blorp_fast_clear_op fast_clear_op;
196    bool color_write_disable[4];
197    struct brw_blorp_wm_inputs wm_inputs;
198    struct blorp_vs_inputs vs_inputs;
199    unsigned num_samples;
200    unsigned num_draw_buffers;
201    unsigned num_layers;
202    uint32_t vs_prog_kernel;
203    struct brw_vs_prog_data *vs_prog_data;
204    uint32_t sf_prog_kernel;
205    struct brw_sf_prog_data *sf_prog_data;
206    uint32_t wm_prog_kernel;
207    struct brw_wm_prog_data *wm_prog_data;
208 
209    bool use_pre_baked_binding_table;
210    uint32_t pre_baked_binding_table_offset;
211 };
212 
/* Initializes *params; the definition lives outside this header.
 * NOTE(review): presumably resets every member to a default state - confirm.
 */
void
blorp_params_init(struct blorp_params *params);
214 
/**
 * Kinds of shader BLORP distinguishes.  The enumerators are consecutive and
 * start at zero.  struct brw_blorp_blit_prog_key stores one of these as its
 * first member.
 */
enum blorp_shader_type {
   BLORP_SHADER_TYPE_BLIT = 0,
   BLORP_SHADER_TYPE_CLEAR,
   BLORP_SHADER_TYPE_MCS_PARTIAL_RESOLVE,
   BLORP_SHADER_TYPE_LAYER_OFFSET_VS,
   BLORP_SHADER_TYPE_GEN4_SF,
};
222 
223 struct brw_blorp_blit_prog_key
224 {
225    enum blorp_shader_type shader_type; /* Must be BLORP_SHADER_TYPE_BLIT */
226 
227    /* Number of samples per pixel that have been configured in the surface
228     * state for texturing from.
229     */
230    unsigned tex_samples;
231 
232    /* MSAA layout that has been configured in the surface state for texturing
233     * from.
234     */
235    enum isl_msaa_layout tex_layout;
236 
237    enum isl_aux_usage tex_aux_usage;
238 
239    /* Actual number of samples per pixel in the source image. */
240    unsigned src_samples;
241 
242    /* Actual MSAA layout used by the source image. */
243    enum isl_msaa_layout src_layout;
244 
245    /* Number of bits per channel in the source image. */
246    uint8_t src_bpc;
247 
248    /* True if the source requires normalized coordinates */
249    bool src_coords_normalized;
250 
251    /* Number of samples per pixel that have been configured in the render
252     * target.
253     */
254    unsigned rt_samples;
255 
256    /* MSAA layout that has been configured in the render target. */
257    enum isl_msaa_layout rt_layout;
258 
259    /* Actual number of samples per pixel in the destination image. */
260    unsigned dst_samples;
261 
262    /* Actual MSAA layout used by the destination image. */
263    enum isl_msaa_layout dst_layout;
264 
265    /* Number of bits per channel in the destination image. */
266    uint8_t dst_bpc;
267 
268    /* Type of the data to be read from the texture (one of
269     * nir_type_(int|uint|float)).
270     */
271    nir_alu_type texture_data_type;
272 
273    /* True if the source image is W tiled.  If true, the surface state for the
274     * source image must be configured as Y tiled, and tex_samples must be 0.
275     */
276    bool src_tiled_w;
277 
278    /* True if the destination image is W tiled.  If true, the surface state
279     * for the render target must be configured as Y tiled, and rt_samples must
280     * be 0.
281     */
282    bool dst_tiled_w;
283 
284    /* True if the destination is an RGB format.  If true, the surface state
285     * for the render target must be configured as red with three times the
286     * normal width.  We need to do this because you cannot render to
287     * non-power-of-two formats.
288     */
289    bool dst_rgb;
290 
291    /* True if all source samples should be blended together to produce each
292     * destination pixel.  If true, src_tiled_w must be false, tex_samples must
293     * equal src_samples, and tex_samples must be nonzero.
294     */
295    bool blend;
296 
297    /* True if the rectangle being sent through the rendering pipeline might be
298     * larger than the destination rectangle, so the WM program should kill any
299     * pixels that are outside the destination rectangle.
300     */
301    bool use_kill;
302 
303    /**
304     * True if the WM program should be run in MSDISPMODE_PERSAMPLE with more
305     * than one sample per pixel.
306     */
307    bool persample_msaa_dispatch;
308 
309    /* True for scaled blitting. */
310    bool blit_scaled;
311 
312    /* True if this blit operation may involve intratile offsets on the source.
313     * In this case, we need to add the offset before texturing.
314     */
315    bool need_src_offset;
316 
317    /* True if this blit operation may involve intratile offsets on the
318     * destination.  In this case, we need to add the offset to gl_FragCoord.
319     */
320    bool need_dst_offset;
321 
322    /* Scale factors between the pixel grid and the grid of samples. We're
323     * using grid of samples for bilinear filetring in multisample scaled blits.
324     */
325    float x_scale;
326    float y_scale;
327 
328    /* True for blits with filter = GL_LINEAR. */
329    bool bilinear_filter;
330 };
331 
/**
 * \name BLORP internals
 * \{
 *
 * Used internally by gen6_blorp_exec() and gen7_blorp_exec().
 *
 * Only the prototypes are visible here; the per-function notes below are
 * inferred from names and signatures and should be confirmed against the
 * definitions.
 */

/* NOTE(review): presumably puts *wm_key into its initial state - confirm. */
void
brw_blorp_init_wm_prog_key(struct brw_wm_prog_key *wm_key);

/* NOTE(review): presumably compiles nir as a fragment shader, fills in
 * *wm_prog_data, and returns the generated program - confirm, including who
 * owns the returned memory (mem_ctx?) and whether NULL signals failure.
 */
const unsigned *
blorp_compile_fs(struct blorp_context *blorp,
                 void *mem_ctx,
                 struct nir_shader *nir,
                 struct brw_wm_prog_key *wm_key,
                 bool use_repclear,
                 struct brw_wm_prog_data *wm_prog_data);

/* NOTE(review): vertex-shader counterpart of blorp_compile_fs(), presumably
 * with the same ownership and failure conventions - confirm.
 */
const unsigned *
blorp_compile_vs(struct blorp_context *blorp,
                 void *mem_ctx,
                 struct nir_shader *nir,
                 struct brw_vs_prog_data *vs_prog_data);

/* NOTE(review): presumably makes sure params has an SF program where one is
 * needed and reports success through the return value - confirm.
 */
bool
blorp_ensure_sf_program(struct blorp_context *blorp,
                        struct blorp_params *params);

/** \} */
358 
359 #ifdef __cplusplus
360 } /* end extern "C" */
361 #endif /* __cplusplus */
362 
363 #endif /* BLORP_PRIV_H */
364