1 /**************************************************************************
2  *
3  * Copyright 2006 Tungsten Graphics, Inc., Cedar Park, Texas.
4  * All Rights Reserved.
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a
7  * copy of this software and associated documentation files (the
8  * "Software"), to deal in the Software without restriction, including
9  * without limitation the rights to use, copy, modify, merge, publish,
10  * distribute, sub license, and/or sell copies of the Software, and to
11  * permit persons to whom the Software is furnished to do so, subject to
12  * the following conditions:
13  *
14  * The above copyright notice and this permission notice (including the
15  * next paragraph) shall be included in all copies or substantial portions
16  * of the Software.
17  *
18  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21  * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22  * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23  * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24  * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25  *
26  **************************************************************************/
27 
28 #ifndef INTEL_MIPMAP_TREE_H
29 #define INTEL_MIPMAP_TREE_H
30 
31 #include <assert.h>
32 
33 #include "intel_regions.h"
34 #include "intel_resolve_map.h"
35 
36 #ifdef __cplusplus
37 extern "C" {
38 #endif
39 
40 /* A layer on top of the intel_regions code which adds:
41  *
42  * - Code to size and layout a region to hold a set of mipmaps.
43  * - Query to determine if a new image fits in an existing tree.
44  * - More refcounting
45  *     - maybe able to remove refcounting from intel_region?
46  * - ?
47  *
48  * The fixed mipmap layout of intel hardware where one offset
49  * specifies the position of all images in a mipmap hierachy
50  * complicates the implementation of GL texture image commands,
51  * compared to hardware where each image is specified with an
52  * independent offset.
53  *
54  * In an ideal world, each texture object would be associated with a
55  * single bufmgr buffer or 2d intel_region, and all the images within
56  * the texture object would slot into the tree as they arrive.  The
57  * reality can be a little messier, as images can arrive from the user
58  * with sizes that don't fit in the existing tree, or in an order
59  * where the tree layout cannot be guessed immediately.
60  *
61  * This structure encodes an idealized mipmap tree.  The GL image
62  * commands build these where possible, otherwise store the images in
63  * temporary system buffers.
64  */
65 
66 struct intel_resolve_map;
67 struct intel_texture_image;
68 
69 struct intel_miptree_map {
70    /** Bitfield of GL_MAP_READ_BIT, GL_MAP_WRITE_BIT, GL_MAP_INVALIDATE_BIT */
71    GLbitfield mode;
72    /** Region of interest for the map. */
73    int x, y, w, h;
74    /** Possibly malloced temporary buffer for the mapping. */
75    void *buffer;
76    /** Possible pointer to a BO temporary for the mapping. */
77    drm_intel_bo *bo;
78    /** Pointer to the start of (map_x, map_y) returned by the mapping. */
79    void *ptr;
80    /** Stride of the mapping. */
81    int stride;
82 
83    /**
84     * intel_mipmap_tree::singlesample_mt is temporary storage that persists
85     * only for the duration of the map.
86     */
87    bool singlesample_mt_is_tmp;
88 };
89 
90 /**
91  * Describes the location of each texture image within a texture region.
92  */
93 struct intel_mipmap_level
94 {
95    /** Offset to this miptree level, used in computing x_offset. */
96    GLuint level_x;
97    /** Offset to this miptree level, used in computing y_offset. */
98    GLuint level_y;
99    GLuint width;
100    GLuint height;
101 
102    /**
103     * \brief Number of 2D slices in this miplevel.
104     *
105     * The exact semantics of depth varies according to the texture target:
106     *    - For GL_TEXTURE_CUBE_MAP, depth is 6.
107     *    - For GL_TEXTURE_2D_ARRAY, depth is the number of array slices. It is
108     *      identical for all miplevels in the texture.
109     *    - For GL_TEXTURE_3D, it is the texture's depth at this miplevel. Its
110     *      value, like width and height, varies with miplevel.
111     *    - For other texture types, depth is 1.
112     */
113    GLuint depth;
114 
115    /**
116     * \brief List of 2D images in this mipmap level.
117     *
118     * This may be a list of cube faces, array slices in 2D array texture, or
119     * layers in a 3D texture. The list's length is \c depth.
120     */
121    struct intel_mipmap_slice {
122       /**
123        * \name Offset to slice
124        * \{
125        *
126        * Hardware formats are so diverse that that there is no unified way to
127        * compute the slice offsets, so we store them in this table.
128        *
129        * The (x, y) offset to slice \c s at level \c l relative the miptrees
130        * base address is
131        * \code
132        *     x = mt->level[l].slice[s].x_offset
133        *     y = mt->level[l].slice[s].y_offset
134        */
135       GLuint x_offset;
136       GLuint y_offset;
137       /** \} */
138 
139       /**
140        * Mapping information. Persistent for the duration of
141        * intel_miptree_map/unmap on this slice.
142        */
143       struct intel_miptree_map *map;
144    } *slice;
145 };
146 
147 /**
148  * Enum for keeping track of the different MSAA layouts supported by Gen7.
149  */
150 enum intel_msaa_layout
151 {
152    /**
153     * Ordinary surface with no MSAA.
154     */
155    INTEL_MSAA_LAYOUT_NONE,
156 
157    /**
158     * Interleaved Multisample Surface.  The additional samples are
159     * accommodated by scaling up the width and the height of the surface so
160     * that all the samples corresponding to a pixel are located at nearby
161     * memory locations.
162     */
163    INTEL_MSAA_LAYOUT_IMS,
164 
165    /**
166     * Uncompressed Multisample Surface.  The surface is stored as a 2D array,
167     * with array slice n containing all pixel data for sample n.
168     */
169    INTEL_MSAA_LAYOUT_UMS,
170 
171    /**
172     * Compressed Multisample Surface.  The surface is stored as in
173     * INTEL_MSAA_LAYOUT_UMS, but there is an additional buffer called the MCS
174     * (Multisample Control Surface) buffer.  Each pixel in the MCS buffer
175     * indicates the mapping from sample number to array slice.  This allows
176     * the common case (where all samples constituting a pixel have the same
177     * color value) to be stored efficiently by just using a single array
178     * slice.
179     */
180    INTEL_MSAA_LAYOUT_CMS,
181 };
182 
183 struct intel_mipmap_tree
184 {
185    /* Effectively the key:
186     */
187    GLenum target;
188 
189    /**
190     * Generally, this is just the same as the gl_texture_image->TexFormat or
191     * gl_renderbuffer->Format.
192     *
193     * However, for textures and renderbuffers with packed depth/stencil formats
194     * on hardware where we want or need to use separate stencil, there will be
195     * two miptrees for storing the data.  If the depthstencil texture or rb is
196     * MESA_FORMAT_Z32_FLOAT_X24S8, then mt->format will be
197     * MESA_FORMAT_Z32_FLOAT, otherwise for MESA_FORMAT_S8_Z24 objects it will be
198     * MESA_FORMAT_X8_Z24.
199     *
200     * For ETC1 textures, this is MESA_FORMAT_RGBX8888_REV if the hardware
201     * lacks support for ETC1. See @ref wraps_etc1.
202     */
203    gl_format format;
204 
205    /**
206     * The X offset of each image in the miptree must be aligned to this. See
207     * the "Alignment Unit Size" section of the BSpec.
208     */
209    unsigned int align_w;
210    unsigned int align_h; /**< \see align_w */
211 
212    GLuint first_level;
213    GLuint last_level;
214 
215    GLuint width0, height0, depth0; /**< Level zero image dimensions */
216    GLuint cpp;
217    GLuint num_samples;
218    bool compressed;
219 
220    /**
221     * If num_samples > 0, then singlesample_width0 is the value that width0
222     * would have if instead a singlesample miptree were created. Note that,
223     * for non-interleaved msaa layouts, the two values are the same.
224     *
225     * If num_samples == 0, then singlesample_width0 is undefined.
226     */
227    uint32_t singlesample_width0;
228 
229    /** \see singlesample_width0 */
230    uint32_t singlesample_height0;
231 
232    /**
233     * For 1D array, 2D array, cube, and 2D multisampled surfaces on Gen7: true
234     * if the surface only contains LOD 0, and hence no space is for LOD's
235     * other than 0 in between array slices.
236     *
237     * Corresponds to the surface_array_spacing bit in gen7_surface_state.
238     */
239    bool array_spacing_lod0;
240 
241    /**
242     * MSAA layout used by this buffer.
243     */
244    enum intel_msaa_layout msaa_layout;
245 
246    /* Derived from the above:
247     */
248    GLuint total_width;
249    GLuint total_height;
250 
251    /* The 3DSTATE_CLEAR_PARAMS value associated with the last depth clear to
252     * this depth mipmap tree, if any.
253     */
254    uint32_t depth_clear_value;
255 
256    /* Includes image offset tables:
257     */
258    struct intel_mipmap_level level[MAX_TEXTURE_LEVELS];
259 
260    /* The data is held here:
261     */
262    struct intel_region *region;
263 
264    /* Offset into region bo where miptree starts:
265     */
266    uint32_t offset;
267 
268    /**
269     * \brief Singlesample miptree.
270     *
271     * This is used under two cases.
272     *
273     * --- Case 1: As persistent singlesample storage for multisample window
274     *  system front and back buffers ---
275     *
276     * Suppose that the window system FBO was created with a multisample
277     * config.  Let `back_irb` be the `intel_renderbuffer` for the FBO's back
278     * buffer. Then `back_irb` contains two miptrees: a parent multisample
279     * miptree (back_irb->mt) and a child singlesample miptree
280     * (back_irb->mt->singlesample_mt).  The DRM buffer shared with DRI2
281     * belongs to `back_irb->mt->singlesample_mt` and contains singlesample
282     * data.  The singlesample miptree is created at the same time as and
283     * persists for the lifetime of its parent multisample miptree.
284     *
285     * When access to the singlesample data is needed, such as at
286     * eglSwapBuffers and glReadPixels, an automatic downsample occurs from
287     * `back_rb->mt` to `back_rb->mt->singlesample_mt` when necessary.
288     *
289     * This description of the back buffer applies analogously to the front
290     * buffer.
291     *
292     *
293     * --- Case 2: As temporary singlesample storage for mapping multisample
294     *  miptrees ---
295     *
296     * Suppose the intel_miptree_map is called on a multisample miptree, `mt`,
297     * for which case 1 does not apply (that is, `mt` does not belong to
298     * a front or back buffer).  Then `mt->singlesample_mt` is null at the
299     * start of the call. intel_miptree_map will create a temporary
300     * singlesample miptree, store it at `mt->singlesample_mt`, downsample from
301     * `mt` to `mt->singlesample_mt` if necessary, then map
302     * `mt->singlesample_mt`. The temporary miptree is later deleted during
303     * intel_miptree_unmap.
304     */
305    struct intel_mipmap_tree *singlesample_mt;
306 
307    /**
308     * \brief A downsample is needed from this miptree to singlesample_mt.
309     */
310    bool need_downsample;
311 
312    /**
313     * \brief HiZ miptree
314     *
315     * This is non-null only if HiZ is enabled for this miptree.
316     *
317     * \see intel_miptree_alloc_hiz()
318     */
319    struct intel_mipmap_tree *hiz_mt;
320 
321    /**
322     * \brief Map of miptree slices to needed resolves.
323     *
324     * This is used only when the miptree has a child HiZ miptree.
325     *
326     * Let \c mt be a depth miptree with HiZ enabled. Then the resolve map is
327     * \c mt->hiz_map. The resolve map of the child HiZ miptree, \c
328     * mt->hiz_mt->hiz_map, is unused.
329     */
330    struct intel_resolve_map hiz_map;
331 
332    /**
333     * \brief Stencil miptree for depthstencil textures.
334     *
335     * This miptree is used for depthstencil textures and renderbuffers that
336     * require separate stencil.  It always has the true copy of the stencil
337     * bits, regardless of mt->format.
338     *
339     * \see intel_miptree_map_depthstencil()
340     * \see intel_miptree_unmap_depthstencil()
341     */
342    struct intel_mipmap_tree *stencil_mt;
343 
344    /**
345     * \brief MCS miptree for multisampled textures.
346     *
347     * This miptree contains the "multisample control surface", which stores
348     * the necessary information to implement compressed MSAA on Gen7+
349     * (INTEL_MSAA_FORMAT_CMS).
350     */
351    struct intel_mipmap_tree *mcs_mt;
352 
353    /**
354     * \brief The miptree contains RGBX data that was originally ETC1 data.
355     *
356     * On hardware that lacks support for ETC1 textures, we do the
357     * following on calls to glCompressedTexImage2D(GL_ETC1_RGB8_OES):
358     *   1. Create a miptree whose format is MESA_FORMAT_RGBX8888_REV with
359     *      the wraps_etc1 flag set.
360     *   2. Translate the ETC1 data into RGBX.
361     *   3. Store the RGBX data into the miptree and discard the ETC1 data.
362     */
363    bool wraps_etc1;
364 
365    /* These are also refcounted:
366     */
367    GLuint refcount;
368 };
369 
370 
371 
372 struct intel_mipmap_tree *intel_miptree_create(struct intel_context *intel,
373                                                GLenum target,
374 					       gl_format format,
375                                                GLuint first_level,
376                                                GLuint last_level,
377                                                GLuint width0,
378                                                GLuint height0,
379                                                GLuint depth0,
380 					       bool expect_accelerated_upload,
381                                                GLuint num_samples,
382                                                enum intel_msaa_layout msaa_layout);
383 
384 struct intel_mipmap_tree *
385 intel_miptree_create_for_region(struct intel_context *intel,
386 				GLenum target,
387 				gl_format format,
388 				struct intel_region *region);
389 
390 struct intel_mipmap_tree*
391 intel_miptree_create_for_dri2_buffer(struct intel_context *intel,
392                                      unsigned dri_attachment,
393                                      gl_format format,
394                                      uint32_t num_samples,
395                                      struct intel_region *region);
396 
397 /**
398  * Create a miptree appropriate as the storage for a non-texture renderbuffer.
399  * The miptree has the following properties:
400  *     - The target is GL_TEXTURE_2D.
401  *     - There are no levels other than the base level 0.
402  *     - Depth is 1.
403  */
404 struct intel_mipmap_tree*
405 intel_miptree_create_for_renderbuffer(struct intel_context *intel,
406                                       gl_format format,
407                                       uint32_t width,
408                                       uint32_t height,
409                                       uint32_t num_samples);
410 
411 /** \brief Assert that the level and layer are valid for the miptree. */
412 static inline void
intel_miptree_check_level_layer(struct intel_mipmap_tree * mt,uint32_t level,uint32_t layer)413 intel_miptree_check_level_layer(struct intel_mipmap_tree *mt,
414                                 uint32_t level,
415                                 uint32_t layer)
416 {
417    assert(level >= mt->first_level);
418    assert(level <= mt->last_level);
419    assert(layer < mt->level[level].depth);
420 }
421 
422 int intel_miptree_pitch_align (struct intel_context *intel,
423 			       struct intel_mipmap_tree *mt,
424 			       uint32_t tiling,
425 			       int pitch);
426 
427 void intel_miptree_reference(struct intel_mipmap_tree **dst,
428                              struct intel_mipmap_tree *src);
429 
430 void intel_miptree_release(struct intel_mipmap_tree **mt);
431 
432 /* Check if an image fits an existing mipmap tree layout
433  */
434 bool intel_miptree_match_image(struct intel_mipmap_tree *mt,
435                                     struct gl_texture_image *image);
436 
437 void
438 intel_miptree_get_image_offset(struct intel_mipmap_tree *mt,
439 			       GLuint level, GLuint face, GLuint depth,
440 			       GLuint *x, GLuint *y);
441 
442 void
443 intel_miptree_get_dimensions_for_image(struct gl_texture_image *image,
444                                        int *width, int *height, int *depth);
445 
446 void intel_miptree_set_level_info(struct intel_mipmap_tree *mt,
447                                   GLuint level,
448                                   GLuint x, GLuint y,
449                                   GLuint w, GLuint h, GLuint d);
450 
451 void intel_miptree_set_image_offset(struct intel_mipmap_tree *mt,
452                                     GLuint level,
453                                     GLuint img, GLuint x, GLuint y);
454 
455 void
456 intel_miptree_copy_teximage(struct intel_context *intel,
457                             struct intel_texture_image *intelImage,
458                             struct intel_mipmap_tree *dst_mt);
459 
460 /**
461  * Copy the stencil data from \c mt->stencil_mt->region to \c mt->region for
462  * the given miptree slice.
463  *
464  * \see intel_mipmap_tree::stencil_mt
465  */
466 void
467 intel_miptree_s8z24_scatter(struct intel_context *intel,
468                             struct intel_mipmap_tree *mt,
469                             uint32_t level,
470                             uint32_t slice);
471 
472 /**
473  * Copy the stencil data in \c mt->stencil_mt->region to \c mt->region for the
474  * given miptree slice.
475  *
476  * \see intel_mipmap_tree::stencil_mt
477  */
478 void
479 intel_miptree_s8z24_gather(struct intel_context *intel,
480                            struct intel_mipmap_tree *mt,
481                            uint32_t level,
482                            uint32_t layer);
483 
484 bool
485 intel_miptree_alloc_mcs(struct intel_context *intel,
486                         struct intel_mipmap_tree *mt,
487                         GLuint num_samples);
488 
489 /**
490  * \name Miptree HiZ functions
491  * \{
492  *
493  * It is safe to call the "slice_set_need_resolve" and "slice_resolve"
494  * functions on a miptree without HiZ. In that case, each function is a no-op.
495  */
496 
497 /**
498  * \brief Allocate the miptree's embedded HiZ miptree.
499  * \see intel_mipmap_tree:hiz_mt
500  * \return false if allocation failed
501  */
502 
503 bool
504 intel_miptree_alloc_hiz(struct intel_context *intel,
505 			struct intel_mipmap_tree *mt,
506                         GLuint num_samples);
507 
508 void
509 intel_miptree_slice_set_needs_hiz_resolve(struct intel_mipmap_tree *mt,
510                                           uint32_t level,
511 					  uint32_t depth);
512 void
513 intel_miptree_slice_set_needs_depth_resolve(struct intel_mipmap_tree *mt,
514                                             uint32_t level,
515 					    uint32_t depth);
516 void
517 intel_miptree_all_slices_set_need_hiz_resolve(struct intel_mipmap_tree *mt);
518 
519 void
520 intel_miptree_all_slices_set_need_depth_resolve(struct intel_mipmap_tree *mt);
521 
522 /**
523  * \return false if no resolve was needed
524  */
525 bool
526 intel_miptree_slice_resolve_hiz(struct intel_context *intel,
527 				struct intel_mipmap_tree *mt,
528 				unsigned int level,
529 				unsigned int depth);
530 
531 /**
532  * \return false if no resolve was needed
533  */
534 bool
535 intel_miptree_slice_resolve_depth(struct intel_context *intel,
536 				  struct intel_mipmap_tree *mt,
537 				  unsigned int level,
538 				  unsigned int depth);
539 
540 /**
541  * \return false if no resolve was needed
542  */
543 bool
544 intel_miptree_all_slices_resolve_hiz(struct intel_context *intel,
545 				     struct intel_mipmap_tree *mt);
546 
547 /**
548  * \return false if no resolve was needed
549  */
550 bool
551 intel_miptree_all_slices_resolve_depth(struct intel_context *intel,
552 				       struct intel_mipmap_tree *mt);
553 
554 /**\}*/
555 
556 void
557 intel_miptree_downsample(struct intel_context *intel,
558                          struct intel_mipmap_tree *mt);
559 
560 void
561 intel_miptree_upsample(struct intel_context *intel,
562                        struct intel_mipmap_tree *mt);
563 
564 /* i915_mipmap_tree.c:
565  */
566 void i915_miptree_layout(struct intel_mipmap_tree *mt);
567 void i945_miptree_layout(struct intel_mipmap_tree *mt);
568 void brw_miptree_layout(struct intel_context *intel,
569 			struct intel_mipmap_tree *mt);
570 
571 void
572 intel_miptree_map(struct intel_context *intel,
573 		  struct intel_mipmap_tree *mt,
574 		  unsigned int level,
575 		  unsigned int slice,
576 		  unsigned int x,
577 		  unsigned int y,
578 		  unsigned int w,
579 		  unsigned int h,
580 		  GLbitfield mode,
581 		  void **out_ptr,
582 		  int *out_stride);
583 
584 void
585 intel_miptree_unmap(struct intel_context *intel,
586 		    struct intel_mipmap_tree *mt,
587 		    unsigned int level,
588 		    unsigned int slice);
589 
590 #ifdef I915
591 static inline void
intel_hiz_exec(struct intel_context * intel,struct intel_mipmap_tree * mt,unsigned int level,unsigned int layer,enum gen6_hiz_op op)592 intel_hiz_exec(struct intel_context *intel, struct intel_mipmap_tree *mt,
593 	       unsigned int level, unsigned int layer, enum gen6_hiz_op op)
594 {
595    /* Stub on i915.  It would be nice if we didn't execute resolve code at all
596     * there.
597     */
598 }
599 #else
600 void
601 intel_hiz_exec(struct intel_context *intel, struct intel_mipmap_tree *mt,
602 	       unsigned int level, unsigned int layer, enum gen6_hiz_op op);
603 #endif
604 
605 #ifdef __cplusplus
606 }
607 #endif
608 
609 #endif
610