1 /*
2  * Copyright © 2011 Red Hat All Rights Reserved.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining
5  * a copy of this software and associated documentation files (the
6  * "Software"), to deal in the Software without restriction, including
7  * without limitation the rights to use, copy, modify, merge, publish,
8  * distribute, sub license, and/or sell copies of the Software, and to
9  * permit persons to whom the Software is furnished to do so, subject to
10  * the following conditions:
11  *
12  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
13  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
14  * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
15  * NON-INFRINGEMENT. IN NO EVENT SHALL THE COPYRIGHT HOLDERS, AUTHORS
16  * AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
17  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
18  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
19  * USE OR OTHER DEALINGS IN THE SOFTWARE.
20  *
21  * The above copyright notice and this permission notice (including the
22  * next paragraph) shall be included in all copies or substantial portions
23  * of the Software.
24  */
25 /*
26  * Authors:
27  *      Jérôme Glisse <jglisse@redhat.com>
28  */
29 #include <stdbool.h>
30 #include <assert.h>
31 #include <errno.h>
32 #include <stdio.h>
33 #include <stdlib.h>
34 #include <string.h>
35 #include <sys/ioctl.h>
36 #include "drm.h"
37 #include "libdrm_macros.h"
38 #include "xf86drm.h"
39 #include "radeon_drm.h"
40 #include "radeon_surface.h"
41 
42 #define CIK_TILE_MODE_COLOR_2D			14
43 #define CIK_TILE_MODE_COLOR_2D_SCANOUT		10
44 #define CIK_TILE_MODE_DEPTH_STENCIL_2D_TILESPLIT_64       0
45 #define CIK_TILE_MODE_DEPTH_STENCIL_2D_TILESPLIT_128      1
46 #define CIK_TILE_MODE_DEPTH_STENCIL_2D_TILESPLIT_256      2
47 #define CIK_TILE_MODE_DEPTH_STENCIL_2D_TILESPLIT_512      3
48 #define CIK_TILE_MODE_DEPTH_STENCIL_2D_TILESPLIT_ROW_SIZE 4
49 
50 #define ALIGN(value, alignment) (((value) + alignment - 1) & ~(alignment - 1))
51 #define MAX2(A, B)              ((A) > (B) ? (A) : (B))
52 #define MIN2(A, B)              ((A) < (B) ? (A) : (B))
53 
54 /* keep this private */
55 enum radeon_family {
56     CHIP_UNKNOWN,
57     CHIP_R600,
58     CHIP_RV610,
59     CHIP_RV630,
60     CHIP_RV670,
61     CHIP_RV620,
62     CHIP_RV635,
63     CHIP_RS780,
64     CHIP_RS880,
65     CHIP_RV770,
66     CHIP_RV730,
67     CHIP_RV710,
68     CHIP_RV740,
69     CHIP_CEDAR,
70     CHIP_REDWOOD,
71     CHIP_JUNIPER,
72     CHIP_CYPRESS,
73     CHIP_HEMLOCK,
74     CHIP_PALM,
75     CHIP_SUMO,
76     CHIP_SUMO2,
77     CHIP_BARTS,
78     CHIP_TURKS,
79     CHIP_CAICOS,
80     CHIP_CAYMAN,
81     CHIP_ARUBA,
82     CHIP_TAHITI,
83     CHIP_PITCAIRN,
84     CHIP_VERDE,
85     CHIP_OLAND,
86     CHIP_HAINAN,
87     CHIP_BONAIRE,
88     CHIP_KAVERI,
89     CHIP_KABINI,
90     CHIP_HAWAII,
91     CHIP_MULLINS,
92     CHIP_LAST,
93 };
94 
95 typedef int (*hw_init_surface_t)(struct radeon_surface_manager *surf_man,
96                                  struct radeon_surface *surf);
97 typedef int (*hw_best_surface_t)(struct radeon_surface_manager *surf_man,
98                                  struct radeon_surface *surf);
99 
100 struct radeon_hw_info {
101     /* apply to r6, eg */
102     uint32_t                        group_bytes;
103     uint32_t                        num_banks;
104     uint32_t                        num_pipes;
105     /* apply to eg */
106     uint32_t                        row_size;
107     unsigned                        allow_2d;
108     /* apply to si */
109     uint32_t                        tile_mode_array[32];
110     /* apply to cik */
111     uint32_t                        macrotile_mode_array[16];
112 };
113 
114 struct radeon_surface_manager {
115     int                         fd;
116     uint32_t                    device_id;
117     struct radeon_hw_info       hw_info;
118     unsigned                    family;
119     hw_init_surface_t           surface_init;
120     hw_best_surface_t           surface_best;
121 };
122 
123 /* helper */
radeon_get_value(int fd,unsigned req,uint32_t * value)124 static int radeon_get_value(int fd, unsigned req, uint32_t *value)
125 {
126     struct drm_radeon_info info = {};
127     int r;
128 
129     *value = 0;
130     info.request = req;
131     info.value = (uintptr_t)value;
132     r = drmCommandWriteRead(fd, DRM_RADEON_INFO, &info,
133                             sizeof(struct drm_radeon_info));
134     return r;
135 }
136 
radeon_get_family(struct radeon_surface_manager * surf_man)137 static int radeon_get_family(struct radeon_surface_manager *surf_man)
138 {
139     switch (surf_man->device_id) {
140 #define CHIPSET(pci_id, name, fam) case pci_id: surf_man->family = CHIP_##fam; break;
141 #include "r600_pci_ids.h"
142 #undef CHIPSET
143     default:
144         return -EINVAL;
145     }
146     return 0;
147 }
148 
next_power_of_two(unsigned x)149 static unsigned next_power_of_two(unsigned x)
150 {
151    if (x <= 1)
152        return 1;
153 
154    return (1 << ((sizeof(unsigned) * 8) - __builtin_clz(x - 1)));
155 }
156 
mip_minify(unsigned size,unsigned level)157 static unsigned mip_minify(unsigned size, unsigned level)
158 {
159     unsigned val;
160 
161     val = MAX2(1, size >> level);
162     if (level > 0)
163         val = next_power_of_two(val);
164     return val;
165 }
166 
surf_minify(struct radeon_surface * surf,struct radeon_surface_level * surflevel,unsigned bpe,unsigned level,uint32_t xalign,uint32_t yalign,uint32_t zalign,uint64_t offset)167 static void surf_minify(struct radeon_surface *surf,
168                         struct radeon_surface_level *surflevel,
169                         unsigned bpe, unsigned level,
170                         uint32_t xalign, uint32_t yalign, uint32_t zalign,
171                         uint64_t offset)
172 {
173     surflevel->npix_x = mip_minify(surf->npix_x, level);
174     surflevel->npix_y = mip_minify(surf->npix_y, level);
175     surflevel->npix_z = mip_minify(surf->npix_z, level);
176     surflevel->nblk_x = (surflevel->npix_x + surf->blk_w - 1) / surf->blk_w;
177     surflevel->nblk_y = (surflevel->npix_y + surf->blk_h - 1) / surf->blk_h;
178     surflevel->nblk_z = (surflevel->npix_z + surf->blk_d - 1) / surf->blk_d;
179     if (surf->nsamples == 1 && surflevel->mode == RADEON_SURF_MODE_2D &&
180         !(surf->flags & RADEON_SURF_FMASK)) {
181         if (surflevel->nblk_x < xalign || surflevel->nblk_y < yalign) {
182             surflevel->mode = RADEON_SURF_MODE_1D;
183             return;
184         }
185     }
186     surflevel->nblk_x  = ALIGN(surflevel->nblk_x, xalign);
187     surflevel->nblk_y  = ALIGN(surflevel->nblk_y, yalign);
188     surflevel->nblk_z  = ALIGN(surflevel->nblk_z, zalign);
189 
190     surflevel->offset = offset;
191     surflevel->pitch_bytes = surflevel->nblk_x * bpe * surf->nsamples;
192     surflevel->slice_size = (uint64_t)surflevel->pitch_bytes * surflevel->nblk_y;
193 
194     surf->bo_size = offset + surflevel->slice_size * surflevel->nblk_z * surf->array_size;
195 }
196 
197 /* ===========================================================================
198  * r600/r700 family
199  */
r6_init_hw_info(struct radeon_surface_manager * surf_man)200 static int r6_init_hw_info(struct radeon_surface_manager *surf_man)
201 {
202     uint32_t tiling_config;
203     drmVersionPtr version;
204     int r;
205 
206     r = radeon_get_value(surf_man->fd, RADEON_INFO_TILING_CONFIG,
207                          &tiling_config);
208     if (r) {
209         return r;
210     }
211 
212     surf_man->hw_info.allow_2d = 0;
213     version = drmGetVersion(surf_man->fd);
214     if (version && version->version_minor >= 14) {
215         surf_man->hw_info.allow_2d = 1;
216     }
217     drmFreeVersion(version);
218 
219     switch ((tiling_config & 0xe) >> 1) {
220     case 0:
221         surf_man->hw_info.num_pipes = 1;
222         break;
223     case 1:
224         surf_man->hw_info.num_pipes = 2;
225         break;
226     case 2:
227         surf_man->hw_info.num_pipes = 4;
228         break;
229     case 3:
230         surf_man->hw_info.num_pipes = 8;
231         break;
232     default:
233         surf_man->hw_info.num_pipes = 8;
234         surf_man->hw_info.allow_2d = 0;
235         break;
236     }
237 
238     switch ((tiling_config & 0x30) >> 4) {
239     case 0:
240         surf_man->hw_info.num_banks = 4;
241         break;
242     case 1:
243         surf_man->hw_info.num_banks = 8;
244         break;
245     default:
246         surf_man->hw_info.num_banks = 8;
247         surf_man->hw_info.allow_2d = 0;
248         break;
249     }
250 
251     switch ((tiling_config & 0xc0) >> 6) {
252     case 0:
253         surf_man->hw_info.group_bytes = 256;
254         break;
255     case 1:
256         surf_man->hw_info.group_bytes = 512;
257         break;
258     default:
259         surf_man->hw_info.group_bytes = 256;
260         surf_man->hw_info.allow_2d = 0;
261         break;
262     }
263     return 0;
264 }
265 
r6_surface_init_linear(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,uint64_t offset,unsigned start_level)266 static int r6_surface_init_linear(struct radeon_surface_manager *surf_man,
267                                   struct radeon_surface *surf,
268                                   uint64_t offset, unsigned start_level)
269 {
270     uint32_t xalign, yalign, zalign;
271     unsigned i;
272 
273     /* compute alignment */
274     if (!start_level) {
275         surf->bo_alignment = MAX2(256, surf_man->hw_info.group_bytes);
276     }
277     /* the 32 alignment is for scanout, cb or db but to allow texture to be
278      * easily bound as such we force this alignment to all surface
279      */
280     xalign = MAX2(1, surf_man->hw_info.group_bytes / surf->bpe);
281     yalign = 1;
282     zalign = 1;
283     if (surf->flags & RADEON_SURF_SCANOUT) {
284         xalign = MAX2((surf->bpe == 1) ? 64 : 32, xalign);
285     }
286 
287     /* build mipmap tree */
288     for (i = start_level; i <= surf->last_level; i++) {
289         surf->level[i].mode = RADEON_SURF_MODE_LINEAR;
290         surf_minify(surf, surf->level+i, surf->bpe, i, xalign, yalign, zalign, offset);
291         /* level0 and first mipmap need to have alignment */
292         offset = surf->bo_size;
293         if (i == 0) {
294             offset = ALIGN(offset, surf->bo_alignment);
295         }
296     }
297     return 0;
298 }
299 
r6_surface_init_linear_aligned(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,uint64_t offset,unsigned start_level)300 static int r6_surface_init_linear_aligned(struct radeon_surface_manager *surf_man,
301                                           struct radeon_surface *surf,
302                                           uint64_t offset, unsigned start_level)
303 {
304     uint32_t xalign, yalign, zalign;
305     unsigned i;
306 
307     /* compute alignment */
308     if (!start_level) {
309         surf->bo_alignment = MAX2(256, surf_man->hw_info.group_bytes);
310     }
311     xalign = MAX2(64, surf_man->hw_info.group_bytes / surf->bpe);
312     yalign = 1;
313     zalign = 1;
314 
315     /* build mipmap tree */
316     for (i = start_level; i <= surf->last_level; i++) {
317         surf->level[i].mode = RADEON_SURF_MODE_LINEAR_ALIGNED;
318         surf_minify(surf, surf->level+i, surf->bpe, i, xalign, yalign, zalign, offset);
319         /* level0 and first mipmap need to have alignment */
320         offset = surf->bo_size;
321         if (i == 0) {
322             offset = ALIGN(offset, surf->bo_alignment);
323         }
324     }
325     return 0;
326 }
327 
r6_surface_init_1d(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,uint64_t offset,unsigned start_level)328 static int r6_surface_init_1d(struct radeon_surface_manager *surf_man,
329                               struct radeon_surface *surf,
330                               uint64_t offset, unsigned start_level)
331 {
332     uint32_t xalign, yalign, zalign, tilew;
333     unsigned i;
334 
335     /* compute alignment */
336     tilew = 8;
337     xalign = surf_man->hw_info.group_bytes / (tilew * surf->bpe * surf->nsamples);
338     xalign = MAX2(tilew, xalign);
339     yalign = tilew;
340     zalign = 1;
341     if (surf->flags & RADEON_SURF_SCANOUT) {
342         xalign = MAX2((surf->bpe == 1) ? 64 : 32, xalign);
343     }
344     if (!start_level) {
345         surf->bo_alignment = MAX2(256, surf_man->hw_info.group_bytes);
346     }
347 
348     /* build mipmap tree */
349     for (i = start_level; i <= surf->last_level; i++) {
350         surf->level[i].mode = RADEON_SURF_MODE_1D;
351         surf_minify(surf, surf->level+i, surf->bpe, i, xalign, yalign, zalign, offset);
352         /* level0 and first mipmap need to have alignment */
353         offset = surf->bo_size;
354         if (i == 0) {
355             offset = ALIGN(offset, surf->bo_alignment);
356         }
357     }
358     return 0;
359 }
360 
r6_surface_init_2d(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,uint64_t offset,unsigned start_level)361 static int r6_surface_init_2d(struct radeon_surface_manager *surf_man,
362                               struct radeon_surface *surf,
363                               uint64_t offset, unsigned start_level)
364 {
365     uint32_t xalign, yalign, zalign, tilew;
366     unsigned i;
367 
368     /* compute alignment */
369     tilew = 8;
370     zalign = 1;
371     xalign = (surf_man->hw_info.group_bytes * surf_man->hw_info.num_banks) /
372              (tilew * surf->bpe * surf->nsamples);
373     xalign = MAX2(tilew * surf_man->hw_info.num_banks, xalign);
374     if (surf->flags & RADEON_SURF_FMASK)
375 	xalign = MAX2(128, xalign);
376     yalign = tilew * surf_man->hw_info.num_pipes;
377     if (surf->flags & RADEON_SURF_SCANOUT) {
378         xalign = MAX2((surf->bpe == 1) ? 64 : 32, xalign);
379     }
380     if (!start_level) {
381         surf->bo_alignment =
382             MAX2(surf_man->hw_info.num_pipes *
383                  surf_man->hw_info.num_banks *
384                  surf->nsamples * surf->bpe * 64,
385                  xalign * yalign * surf->nsamples * surf->bpe);
386     }
387 
388     /* build mipmap tree */
389     for (i = start_level; i <= surf->last_level; i++) {
390         surf->level[i].mode = RADEON_SURF_MODE_2D;
391         surf_minify(surf, surf->level+i, surf->bpe, i, xalign, yalign, zalign, offset);
392         if (surf->level[i].mode == RADEON_SURF_MODE_1D) {
393             return r6_surface_init_1d(surf_man, surf, offset, i);
394         }
395         /* level0 and first mipmap need to have alignment */
396         offset = surf->bo_size;
397         if (i == 0) {
398             offset = ALIGN(offset, surf->bo_alignment);
399         }
400     }
401     return 0;
402 }
403 
r6_surface_init(struct radeon_surface_manager * surf_man,struct radeon_surface * surf)404 static int r6_surface_init(struct radeon_surface_manager *surf_man,
405                            struct radeon_surface *surf)
406 {
407     unsigned mode;
408     int r;
409 
410     /* MSAA surfaces support the 2D mode only. */
411     if (surf->nsamples > 1) {
412         surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
413         surf->flags |= RADEON_SURF_SET(RADEON_SURF_MODE_2D, MODE);
414     }
415 
416     /* tiling mode */
417     mode = (surf->flags >> RADEON_SURF_MODE_SHIFT) & RADEON_SURF_MODE_MASK;
418 
419     if (surf->flags & (RADEON_SURF_ZBUFFER | RADEON_SURF_SBUFFER)) {
420         /* zbuffer only support 1D or 2D tiled surface */
421         switch (mode) {
422         case RADEON_SURF_MODE_1D:
423         case RADEON_SURF_MODE_2D:
424             break;
425         default:
426             mode = RADEON_SURF_MODE_1D;
427             surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
428             surf->flags |= RADEON_SURF_SET(RADEON_SURF_MODE_1D, MODE);
429             break;
430         }
431     }
432 
433     /* force 1d on kernel that can't do 2d */
434     if (!surf_man->hw_info.allow_2d && mode > RADEON_SURF_MODE_1D) {
435         if (surf->nsamples > 1) {
436             fprintf(stderr, "radeon: Cannot use 2D tiling for an MSAA surface (%i).\n", __LINE__);
437             return -EFAULT;
438         }
439         mode = RADEON_SURF_MODE_1D;
440         surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
441         surf->flags |= RADEON_SURF_SET(mode, MODE);
442     }
443 
444     /* check surface dimension */
445     if (surf->npix_x > 8192 || surf->npix_y > 8192 || surf->npix_z > 8192) {
446         return -EINVAL;
447     }
448 
449     /* check mipmap last_level */
450     if (surf->last_level > 14) {
451         return -EINVAL;
452     }
453 
454     /* check tiling mode */
455     switch (mode) {
456     case RADEON_SURF_MODE_LINEAR:
457         r = r6_surface_init_linear(surf_man, surf, 0, 0);
458         break;
459     case RADEON_SURF_MODE_LINEAR_ALIGNED:
460         r = r6_surface_init_linear_aligned(surf_man, surf, 0, 0);
461         break;
462     case RADEON_SURF_MODE_1D:
463         r = r6_surface_init_1d(surf_man, surf, 0, 0);
464         break;
465     case RADEON_SURF_MODE_2D:
466         r = r6_surface_init_2d(surf_man, surf, 0, 0);
467         break;
468     default:
469         return -EINVAL;
470     }
471     return r;
472 }
473 
r6_surface_best(struct radeon_surface_manager * surf_man,struct radeon_surface * surf)474 static int r6_surface_best(struct radeon_surface_manager *surf_man,
475                            struct radeon_surface *surf)
476 {
477     /* no value to optimize for r6xx/r7xx */
478     return 0;
479 }
480 
481 
482 /* ===========================================================================
483  * evergreen family
484  */
eg_init_hw_info(struct radeon_surface_manager * surf_man)485 static int eg_init_hw_info(struct radeon_surface_manager *surf_man)
486 {
487     uint32_t tiling_config;
488     drmVersionPtr version;
489     int r;
490 
491     r = radeon_get_value(surf_man->fd, RADEON_INFO_TILING_CONFIG,
492                          &tiling_config);
493     if (r) {
494         return r;
495     }
496 
497     surf_man->hw_info.allow_2d = 0;
498     version = drmGetVersion(surf_man->fd);
499     if (version && version->version_minor >= 16) {
500         surf_man->hw_info.allow_2d = 1;
501     }
502     drmFreeVersion(version);
503 
504     switch (tiling_config & 0xf) {
505     case 0:
506         surf_man->hw_info.num_pipes = 1;
507         break;
508     case 1:
509         surf_man->hw_info.num_pipes = 2;
510         break;
511     case 2:
512         surf_man->hw_info.num_pipes = 4;
513         break;
514     case 3:
515         surf_man->hw_info.num_pipes = 8;
516         break;
517     default:
518         surf_man->hw_info.num_pipes = 8;
519         surf_man->hw_info.allow_2d = 0;
520         break;
521     }
522 
523     switch ((tiling_config & 0xf0) >> 4) {
524     case 0:
525         surf_man->hw_info.num_banks = 4;
526         break;
527     case 1:
528         surf_man->hw_info.num_banks = 8;
529         break;
530     case 2:
531         surf_man->hw_info.num_banks = 16;
532         break;
533     default:
534         surf_man->hw_info.num_banks = 8;
535         surf_man->hw_info.allow_2d = 0;
536         break;
537     }
538 
539     switch ((tiling_config & 0xf00) >> 8) {
540     case 0:
541         surf_man->hw_info.group_bytes = 256;
542         break;
543     case 1:
544         surf_man->hw_info.group_bytes = 512;
545         break;
546     default:
547         surf_man->hw_info.group_bytes = 256;
548         surf_man->hw_info.allow_2d = 0;
549         break;
550     }
551 
552     switch ((tiling_config & 0xf000) >> 12) {
553     case 0:
554         surf_man->hw_info.row_size = 1024;
555         break;
556     case 1:
557         surf_man->hw_info.row_size = 2048;
558         break;
559     case 2:
560         surf_man->hw_info.row_size = 4096;
561         break;
562     default:
563         surf_man->hw_info.row_size = 4096;
564         surf_man->hw_info.allow_2d = 0;
565         break;
566     }
567     return 0;
568 }
569 
eg_surf_minify(struct radeon_surface * surf,struct radeon_surface_level * surflevel,unsigned bpe,unsigned level,unsigned slice_pt,unsigned mtilew,unsigned mtileh,unsigned mtileb,uint64_t offset)570 static void eg_surf_minify(struct radeon_surface *surf,
571                            struct radeon_surface_level *surflevel,
572                            unsigned bpe,
573                            unsigned level,
574                            unsigned slice_pt,
575                            unsigned mtilew,
576                            unsigned mtileh,
577                            unsigned mtileb,
578                            uint64_t offset)
579 {
580     unsigned mtile_pr, mtile_ps;
581 
582     surflevel->npix_x = mip_minify(surf->npix_x, level);
583     surflevel->npix_y = mip_minify(surf->npix_y, level);
584     surflevel->npix_z = mip_minify(surf->npix_z, level);
585     surflevel->nblk_x = (surflevel->npix_x + surf->blk_w - 1) / surf->blk_w;
586     surflevel->nblk_y = (surflevel->npix_y + surf->blk_h - 1) / surf->blk_h;
587     surflevel->nblk_z = (surflevel->npix_z + surf->blk_d - 1) / surf->blk_d;
588     if (surf->nsamples == 1 && surflevel->mode == RADEON_SURF_MODE_2D &&
589         !(surf->flags & RADEON_SURF_FMASK)) {
590         if (surflevel->nblk_x < mtilew || surflevel->nblk_y < mtileh) {
591             surflevel->mode = RADEON_SURF_MODE_1D;
592             return;
593         }
594     }
595     surflevel->nblk_x  = ALIGN(surflevel->nblk_x, mtilew);
596     surflevel->nblk_y  = ALIGN(surflevel->nblk_y, mtileh);
597     surflevel->nblk_z  = ALIGN(surflevel->nblk_z, 1);
598 
599     /* macro tile per row */
600     mtile_pr = surflevel->nblk_x / mtilew;
601     /* macro tile per slice */
602     mtile_ps = (mtile_pr * surflevel->nblk_y) / mtileh;
603 
604     surflevel->offset = offset;
605     surflevel->pitch_bytes = surflevel->nblk_x * bpe * surf->nsamples;
606     surflevel->slice_size = (uint64_t)mtile_ps * mtileb * slice_pt;
607 
608     surf->bo_size = offset + surflevel->slice_size * surflevel->nblk_z * surf->array_size;
609 }
610 
eg_surface_init_1d(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,struct radeon_surface_level * level,unsigned bpe,uint64_t offset,unsigned start_level)611 static int eg_surface_init_1d(struct radeon_surface_manager *surf_man,
612                               struct radeon_surface *surf,
613                               struct radeon_surface_level *level,
614                               unsigned bpe,
615                               uint64_t offset, unsigned start_level)
616 {
617     uint32_t xalign, yalign, zalign, tilew;
618     unsigned i;
619 
620     /* compute alignment */
621     tilew = 8;
622     xalign = surf_man->hw_info.group_bytes / (tilew * bpe * surf->nsamples);
623     xalign = MAX2(tilew, xalign);
624     yalign = tilew;
625     zalign = 1;
626     if (surf->flags & RADEON_SURF_SCANOUT) {
627         xalign = MAX2((bpe == 1) ? 64 : 32, xalign);
628     }
629 
630     if (!start_level) {
631         unsigned alignment = MAX2(256, surf_man->hw_info.group_bytes);
632         surf->bo_alignment = MAX2(surf->bo_alignment, alignment);
633 
634         if (offset) {
635             offset = ALIGN(offset, alignment);
636         }
637     }
638 
639     /* build mipmap tree */
640     for (i = start_level; i <= surf->last_level; i++) {
641         level[i].mode = RADEON_SURF_MODE_1D;
642         surf_minify(surf, level+i, bpe, i, xalign, yalign, zalign, offset);
643         /* level0 and first mipmap need to have alignment */
644         offset = surf->bo_size;
645         if (i == 0) {
646             offset = ALIGN(offset, surf->bo_alignment);
647         }
648     }
649     return 0;
650 }
651 
eg_surface_init_2d(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,struct radeon_surface_level * level,unsigned bpe,unsigned tile_split,uint64_t offset,unsigned start_level)652 static int eg_surface_init_2d(struct radeon_surface_manager *surf_man,
653                               struct radeon_surface *surf,
654                               struct radeon_surface_level *level,
655                               unsigned bpe, unsigned tile_split,
656                               uint64_t offset, unsigned start_level)
657 {
658     unsigned tilew, tileh, tileb;
659     unsigned mtilew, mtileh, mtileb;
660     unsigned slice_pt;
661     unsigned i;
662 
663     /* compute tile values */
664     tilew = 8;
665     tileh = 8;
666     tileb = tilew * tileh * bpe * surf->nsamples;
667     /* slices per tile */
668     slice_pt = 1;
669     if (tileb > tile_split && tile_split) {
670         slice_pt = tileb / tile_split;
671     }
672     tileb = tileb / slice_pt;
673 
674     /* macro tile width & height */
675     mtilew = (tilew * surf->bankw * surf_man->hw_info.num_pipes) * surf->mtilea;
676     mtileh = (tileh * surf->bankh * surf_man->hw_info.num_banks) / surf->mtilea;
677     /* macro tile bytes */
678     mtileb = (mtilew / tilew) * (mtileh / tileh) * tileb;
679 
680     if (!start_level) {
681         unsigned alignment = MAX2(256, mtileb);
682         surf->bo_alignment = MAX2(surf->bo_alignment, alignment);
683 
684         if (offset) {
685             offset = ALIGN(offset, alignment);
686         }
687     }
688 
689     /* build mipmap tree */
690     for (i = start_level; i <= surf->last_level; i++) {
691         level[i].mode = RADEON_SURF_MODE_2D;
692         eg_surf_minify(surf, level+i, bpe, i, slice_pt, mtilew, mtileh, mtileb, offset);
693         if (level[i].mode == RADEON_SURF_MODE_1D) {
694             return eg_surface_init_1d(surf_man, surf, level, bpe, offset, i);
695         }
696         /* level0 and first mipmap need to have alignment */
697         offset = surf->bo_size;
698         if (i == 0) {
699             offset = ALIGN(offset, surf->bo_alignment);
700         }
701     }
702     return 0;
703 }
704 
eg_surface_sanity(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,unsigned mode)705 static int eg_surface_sanity(struct radeon_surface_manager *surf_man,
706                              struct radeon_surface *surf,
707                              unsigned mode)
708 {
709     unsigned tileb;
710 
711     /* check surface dimension */
712     if (surf->npix_x > 16384 || surf->npix_y > 16384 || surf->npix_z > 16384) {
713         return -EINVAL;
714     }
715 
716     /* check mipmap last_level */
717     if (surf->last_level > 15) {
718         return -EINVAL;
719     }
720 
721     /* force 1d on kernel that can't do 2d */
722     if (!surf_man->hw_info.allow_2d && mode > RADEON_SURF_MODE_1D) {
723         if (surf->nsamples > 1) {
724             fprintf(stderr, "radeon: Cannot use 2D tiling for an MSAA surface (%i).\n", __LINE__);
725             return -EFAULT;
726         }
727         mode = RADEON_SURF_MODE_1D;
728         surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
729         surf->flags |= RADEON_SURF_SET(mode, MODE);
730     }
731 
732     /* check tile split */
733     if (mode == RADEON_SURF_MODE_2D) {
734         switch (surf->tile_split) {
735         case 64:
736         case 128:
737         case 256:
738         case 512:
739         case 1024:
740         case 2048:
741         case 4096:
742             break;
743         default:
744             return -EINVAL;
745         }
746         switch (surf->mtilea) {
747         case 1:
748         case 2:
749         case 4:
750         case 8:
751             break;
752         default:
753             return -EINVAL;
754         }
755         /* check aspect ratio */
756         if (surf_man->hw_info.num_banks < surf->mtilea) {
757             return -EINVAL;
758         }
759         /* check bank width */
760         switch (surf->bankw) {
761         case 1:
762         case 2:
763         case 4:
764         case 8:
765             break;
766         default:
767             return -EINVAL;
768         }
769         /* check bank height */
770         switch (surf->bankh) {
771         case 1:
772         case 2:
773         case 4:
774         case 8:
775             break;
776         default:
777             return -EINVAL;
778         }
779         tileb = MIN2(surf->tile_split, 64 * surf->bpe * surf->nsamples);
780         if ((tileb * surf->bankh * surf->bankw) < surf_man->hw_info.group_bytes) {
781             return -EINVAL;
782         }
783     }
784 
785     return 0;
786 }
787 
eg_surface_init_1d_miptrees(struct radeon_surface_manager * surf_man,struct radeon_surface * surf)788 static int eg_surface_init_1d_miptrees(struct radeon_surface_manager *surf_man,
789                                        struct radeon_surface *surf)
790 {
791     unsigned zs_flags = RADEON_SURF_ZBUFFER | RADEON_SURF_SBUFFER;
792     int r, is_depth_stencil = (surf->flags & zs_flags) == zs_flags;
793     /* Old libdrm_macros.headers didn't have stencil_level in it. This prevents crashes. */
794     struct radeon_surface_level tmp[RADEON_SURF_MAX_LEVEL];
795     struct radeon_surface_level *stencil_level =
796         (surf->flags & RADEON_SURF_HAS_SBUFFER_MIPTREE) ? surf->stencil_level : tmp;
797 
798     r = eg_surface_init_1d(surf_man, surf, surf->level, surf->bpe, 0, 0);
799     if (r)
800         return r;
801 
802     if (is_depth_stencil) {
803         r = eg_surface_init_1d(surf_man, surf, stencil_level, 1,
804                                surf->bo_size, 0);
805         surf->stencil_offset = stencil_level[0].offset;
806     }
807     return r;
808 }
809 
eg_surface_init_2d_miptrees(struct radeon_surface_manager * surf_man,struct radeon_surface * surf)810 static int eg_surface_init_2d_miptrees(struct radeon_surface_manager *surf_man,
811                                        struct radeon_surface *surf)
812 {
813     unsigned zs_flags = RADEON_SURF_ZBUFFER | RADEON_SURF_SBUFFER;
814     int r, is_depth_stencil = (surf->flags & zs_flags) == zs_flags;
815     /* Old libdrm_macros.headers didn't have stencil_level in it. This prevents crashes. */
816     struct radeon_surface_level tmp[RADEON_SURF_MAX_LEVEL];
817     struct radeon_surface_level *stencil_level =
818         (surf->flags & RADEON_SURF_HAS_SBUFFER_MIPTREE) ? surf->stencil_level : tmp;
819 
820     r = eg_surface_init_2d(surf_man, surf, surf->level, surf->bpe,
821                            surf->tile_split, 0, 0);
822     if (r)
823         return r;
824 
825     if (is_depth_stencil) {
826         r = eg_surface_init_2d(surf_man, surf, stencil_level, 1,
827                                surf->stencil_tile_split, surf->bo_size, 0);
828         surf->stencil_offset = stencil_level[0].offset;
829     }
830     return r;
831 }
832 
eg_surface_init(struct radeon_surface_manager * surf_man,struct radeon_surface * surf)833 static int eg_surface_init(struct radeon_surface_manager *surf_man,
834                            struct radeon_surface *surf)
835 {
836     unsigned mode;
837     int r;
838 
839     /* MSAA surfaces support the 2D mode only. */
840     if (surf->nsamples > 1) {
841         surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
842         surf->flags |= RADEON_SURF_SET(RADEON_SURF_MODE_2D, MODE);
843     }
844 
845     /* tiling mode */
846     mode = (surf->flags >> RADEON_SURF_MODE_SHIFT) & RADEON_SURF_MODE_MASK;
847 
848     if (surf->flags & (RADEON_SURF_ZBUFFER | RADEON_SURF_SBUFFER)) {
849         /* zbuffer only support 1D or 2D tiled surface */
850         switch (mode) {
851         case RADEON_SURF_MODE_1D:
852         case RADEON_SURF_MODE_2D:
853             break;
854         default:
855             mode = RADEON_SURF_MODE_1D;
856             surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
857             surf->flags |= RADEON_SURF_SET(RADEON_SURF_MODE_1D, MODE);
858             break;
859         }
860     }
861 
862     r = eg_surface_sanity(surf_man, surf, mode);
863     if (r) {
864         return r;
865     }
866 
867     surf->stencil_offset = 0;
868     surf->bo_alignment = 0;
869 
870     /* check tiling mode */
871     switch (mode) {
872     case RADEON_SURF_MODE_LINEAR:
873         r = r6_surface_init_linear(surf_man, surf, 0, 0);
874         break;
875     case RADEON_SURF_MODE_LINEAR_ALIGNED:
876         r = r6_surface_init_linear_aligned(surf_man, surf, 0, 0);
877         break;
878     case RADEON_SURF_MODE_1D:
879         r = eg_surface_init_1d_miptrees(surf_man, surf);
880         break;
881     case RADEON_SURF_MODE_2D:
882         r = eg_surface_init_2d_miptrees(surf_man, surf);
883         break;
884     default:
885         return -EINVAL;
886     }
887     return r;
888 }
889 
log2_int(unsigned x)890 static unsigned log2_int(unsigned x)
891 {
892     unsigned l;
893 
894     if (x < 2) {
895         return 0;
896     }
897     for (l = 2; ; l++) {
898         if ((unsigned)(1 << l) > x) {
899             return l - 1;
900         }
901     }
902     return 0;
903 }
904 
905 /* compute best tile_split, bankw, bankh, mtilea
906  * depending on surface
907  */
eg_surface_best(struct radeon_surface_manager * surf_man,struct radeon_surface * surf)908 static int eg_surface_best(struct radeon_surface_manager *surf_man,
909                            struct radeon_surface *surf)
910 {
911     unsigned mode, tileb, h_over_w;
912     int r;
913 
914     /* tiling mode */
915     mode = (surf->flags >> RADEON_SURF_MODE_SHIFT) & RADEON_SURF_MODE_MASK;
916 
917     /* set some default value to avoid sanity check choking on them */
918     surf->tile_split = 1024;
919     surf->bankw = 1;
920     surf->bankh = 1;
921     surf->mtilea = surf_man->hw_info.num_banks;
922     tileb = MIN2(surf->tile_split, 64 * surf->bpe * surf->nsamples);
923     for (; surf->bankh <= 8; surf->bankh *= 2) {
924         if ((tileb * surf->bankh * surf->bankw) >= surf_man->hw_info.group_bytes) {
925             break;
926         }
927     }
928     if (surf->mtilea > 8) {
929         surf->mtilea = 8;
930     }
931 
932     r = eg_surface_sanity(surf_man, surf, mode);
933     if (r) {
934         return r;
935     }
936 
937     if (mode != RADEON_SURF_MODE_2D) {
938         /* nothing to do for non 2D tiled surface */
939         return 0;
940     }
941 
942     /* Tweak TILE_SPLIT for performance here. */
943     if (surf->nsamples > 1) {
944         if (surf->flags & (RADEON_SURF_ZBUFFER | RADEON_SURF_SBUFFER)) {
945             switch (surf->nsamples) {
946             case 2:
947                 surf->tile_split = 128;
948                 break;
949             case 4:
950                 surf->tile_split = 128;
951                 break;
952             case 8:
953                 surf->tile_split = 256;
954                 break;
955             case 16: /* cayman only */
956                 surf->tile_split = 512;
957                 break;
958             default:
959                 fprintf(stderr, "radeon: Wrong number of samples %i (%i)\n",
960                         surf->nsamples, __LINE__);
961                 return -EINVAL;
962             }
963             surf->stencil_tile_split = 64;
964         } else {
965             /* tile split must be >= 256 for colorbuffer surfaces,
966              * SAMPLE_SPLIT = tile_split / (bpe * 64), the optimal value is 2
967              */
968             surf->tile_split = MAX2(2 * surf->bpe * 64, 256);
969             if (surf->tile_split > 4096)
970                 surf->tile_split = 4096;
971         }
972     } else {
973         /* set tile split to row size */
974         surf->tile_split = surf_man->hw_info.row_size;
975         surf->stencil_tile_split = surf_man->hw_info.row_size / 2;
976     }
977 
978     /* bankw or bankh greater than 1 increase alignment requirement, not
979      * sure if it's worth using smaller bankw & bankh to stick with 2D
980      * tiling on small surface rather than falling back to 1D tiling.
981      * Use recommended value based on tile size for now.
982      *
983      * fmask buffer has different optimal value figure them out once we
984      * use it.
985      */
986     if (surf->flags & RADEON_SURF_SBUFFER) {
987         /* assume 1 bytes for stencil, we optimize for stencil as stencil
988          * and depth shares surface values
989          */
990         tileb = MIN2(surf->tile_split, 64 * surf->nsamples);
991     } else {
992         tileb = MIN2(surf->tile_split, 64 * surf->bpe * surf->nsamples);
993     }
994 
995     /* use bankw of 1 to minimize width alignment, might be interesting to
996      * increase it for large surface
997      */
998     surf->bankw = 1;
999     switch (tileb) {
1000     case 64:
1001         surf->bankh = 4;
1002         break;
1003     case 128:
1004     case 256:
1005         surf->bankh = 2;
1006         break;
1007     default:
1008         surf->bankh = 1;
1009         break;
1010     }
1011     /* double check the constraint */
1012     for (; surf->bankh <= 8; surf->bankh *= 2) {
1013         if ((tileb * surf->bankh * surf->bankw) >= surf_man->hw_info.group_bytes) {
1014             break;
1015         }
1016     }
1017 
1018     h_over_w = (((surf->bankh * surf_man->hw_info.num_banks) << 16) /
1019                 (surf->bankw * surf_man->hw_info.num_pipes)) >> 16;
1020     surf->mtilea = 1 << (log2_int(h_over_w) >> 1);
1021 
1022     return 0;
1023 }
1024 
1025 
1026 /* ===========================================================================
1027  * Southern Islands family
1028  */
1029 #define SI__GB_TILE_MODE__PIPE_CONFIG(x)        (((x) >> 6) & 0x1f)
1030 #define     SI__PIPE_CONFIG__ADDR_SURF_P2               0
1031 #define     SI__PIPE_CONFIG__ADDR_SURF_P4_8x16          4
1032 #define     SI__PIPE_CONFIG__ADDR_SURF_P4_16x16         5
1033 #define     SI__PIPE_CONFIG__ADDR_SURF_P4_16x32         6
1034 #define     SI__PIPE_CONFIG__ADDR_SURF_P4_32x32         7
1035 #define     SI__PIPE_CONFIG__ADDR_SURF_P8_16x16_8x16    8
1036 #define     SI__PIPE_CONFIG__ADDR_SURF_P8_16x32_8x16    9
1037 #define     SI__PIPE_CONFIG__ADDR_SURF_P8_32x32_8x16    10
1038 #define     SI__PIPE_CONFIG__ADDR_SURF_P8_16x32_16x16   11
1039 #define     SI__PIPE_CONFIG__ADDR_SURF_P8_32x32_16x16   12
1040 #define     SI__PIPE_CONFIG__ADDR_SURF_P8_32x32_16x32   13
1041 #define     SI__PIPE_CONFIG__ADDR_SURF_P8_32x64_32x32   14
1042 #define SI__GB_TILE_MODE__TILE_SPLIT(x)         (((x) >> 11) & 0x7)
1043 #define     SI__TILE_SPLIT__64B                         0
1044 #define     SI__TILE_SPLIT__128B                        1
1045 #define     SI__TILE_SPLIT__256B                        2
1046 #define     SI__TILE_SPLIT__512B                        3
1047 #define     SI__TILE_SPLIT__1024B                       4
1048 #define     SI__TILE_SPLIT__2048B                       5
1049 #define     SI__TILE_SPLIT__4096B                       6
1050 #define SI__GB_TILE_MODE__BANK_WIDTH(x)         (((x) >> 14) & 0x3)
1051 #define     SI__BANK_WIDTH__1                           0
1052 #define     SI__BANK_WIDTH__2                           1
1053 #define     SI__BANK_WIDTH__4                           2
1054 #define     SI__BANK_WIDTH__8                           3
1055 #define SI__GB_TILE_MODE__BANK_HEIGHT(x)        (((x) >> 16) & 0x3)
1056 #define     SI__BANK_HEIGHT__1                          0
1057 #define     SI__BANK_HEIGHT__2                          1
1058 #define     SI__BANK_HEIGHT__4                          2
1059 #define     SI__BANK_HEIGHT__8                          3
1060 #define SI__GB_TILE_MODE__MACRO_TILE_ASPECT(x)  (((x) >> 18) & 0x3)
1061 #define     SI__MACRO_TILE_ASPECT__1                    0
1062 #define     SI__MACRO_TILE_ASPECT__2                    1
1063 #define     SI__MACRO_TILE_ASPECT__4                    2
1064 #define     SI__MACRO_TILE_ASPECT__8                    3
1065 #define SI__GB_TILE_MODE__NUM_BANKS(x)          (((x) >> 20) & 0x3)
1066 #define     SI__NUM_BANKS__2_BANK                       0
1067 #define     SI__NUM_BANKS__4_BANK                       1
1068 #define     SI__NUM_BANKS__8_BANK                       2
1069 #define     SI__NUM_BANKS__16_BANK                      3
1070 
1071 
si_gb_tile_mode(uint32_t gb_tile_mode,unsigned * num_pipes,unsigned * num_banks,uint32_t * macro_tile_aspect,uint32_t * bank_w,uint32_t * bank_h,uint32_t * tile_split)1072 static void si_gb_tile_mode(uint32_t gb_tile_mode,
1073                             unsigned *num_pipes,
1074                             unsigned *num_banks,
1075                             uint32_t *macro_tile_aspect,
1076                             uint32_t *bank_w,
1077                             uint32_t *bank_h,
1078                             uint32_t *tile_split)
1079 {
1080     if (num_pipes) {
1081         switch (SI__GB_TILE_MODE__PIPE_CONFIG(gb_tile_mode)) {
1082         case SI__PIPE_CONFIG__ADDR_SURF_P2:
1083         default:
1084             *num_pipes = 2;
1085             break;
1086         case SI__PIPE_CONFIG__ADDR_SURF_P4_8x16:
1087         case SI__PIPE_CONFIG__ADDR_SURF_P4_16x16:
1088         case SI__PIPE_CONFIG__ADDR_SURF_P4_16x32:
1089         case SI__PIPE_CONFIG__ADDR_SURF_P4_32x32:
1090             *num_pipes = 4;
1091             break;
1092         case SI__PIPE_CONFIG__ADDR_SURF_P8_16x16_8x16:
1093         case SI__PIPE_CONFIG__ADDR_SURF_P8_16x32_8x16:
1094         case SI__PIPE_CONFIG__ADDR_SURF_P8_32x32_8x16:
1095         case SI__PIPE_CONFIG__ADDR_SURF_P8_16x32_16x16:
1096         case SI__PIPE_CONFIG__ADDR_SURF_P8_32x32_16x16:
1097         case SI__PIPE_CONFIG__ADDR_SURF_P8_32x32_16x32:
1098         case SI__PIPE_CONFIG__ADDR_SURF_P8_32x64_32x32:
1099             *num_pipes = 8;
1100             break;
1101         }
1102     }
1103     if (num_banks) {
1104         switch (SI__GB_TILE_MODE__NUM_BANKS(gb_tile_mode)) {
1105         default:
1106         case SI__NUM_BANKS__2_BANK:
1107             *num_banks = 2;
1108             break;
1109         case SI__NUM_BANKS__4_BANK:
1110             *num_banks = 4;
1111             break;
1112         case SI__NUM_BANKS__8_BANK:
1113             *num_banks = 8;
1114             break;
1115         case SI__NUM_BANKS__16_BANK:
1116             *num_banks = 16;
1117             break;
1118         }
1119     }
1120     if (macro_tile_aspect) {
1121         switch (SI__GB_TILE_MODE__MACRO_TILE_ASPECT(gb_tile_mode)) {
1122         default:
1123         case SI__MACRO_TILE_ASPECT__1:
1124             *macro_tile_aspect = 1;
1125             break;
1126         case SI__MACRO_TILE_ASPECT__2:
1127             *macro_tile_aspect = 2;
1128             break;
1129         case SI__MACRO_TILE_ASPECT__4:
1130             *macro_tile_aspect = 4;
1131             break;
1132         case SI__MACRO_TILE_ASPECT__8:
1133             *macro_tile_aspect = 8;
1134             break;
1135         }
1136     }
1137     if (bank_w) {
1138         switch (SI__GB_TILE_MODE__BANK_WIDTH(gb_tile_mode)) {
1139         default:
1140         case SI__BANK_WIDTH__1:
1141             *bank_w = 1;
1142             break;
1143         case SI__BANK_WIDTH__2:
1144             *bank_w = 2;
1145             break;
1146         case SI__BANK_WIDTH__4:
1147             *bank_w = 4;
1148             break;
1149         case SI__BANK_WIDTH__8:
1150             *bank_w = 8;
1151             break;
1152         }
1153     }
1154     if (bank_h) {
1155         switch (SI__GB_TILE_MODE__BANK_HEIGHT(gb_tile_mode)) {
1156         default:
1157         case SI__BANK_HEIGHT__1:
1158             *bank_h = 1;
1159             break;
1160         case SI__BANK_HEIGHT__2:
1161             *bank_h = 2;
1162             break;
1163         case SI__BANK_HEIGHT__4:
1164             *bank_h = 4;
1165             break;
1166         case SI__BANK_HEIGHT__8:
1167             *bank_h = 8;
1168             break;
1169         }
1170     }
1171     if (tile_split) {
1172         switch (SI__GB_TILE_MODE__TILE_SPLIT(gb_tile_mode)) {
1173         default:
1174         case SI__TILE_SPLIT__64B:
1175             *tile_split = 64;
1176             break;
1177         case SI__TILE_SPLIT__128B:
1178             *tile_split = 128;
1179             break;
1180         case SI__TILE_SPLIT__256B:
1181             *tile_split = 256;
1182             break;
1183         case SI__TILE_SPLIT__512B:
1184             *tile_split = 512;
1185             break;
1186         case SI__TILE_SPLIT__1024B:
1187             *tile_split = 1024;
1188             break;
1189         case SI__TILE_SPLIT__2048B:
1190             *tile_split = 2048;
1191             break;
1192         case SI__TILE_SPLIT__4096B:
1193             *tile_split = 4096;
1194             break;
1195         }
1196     }
1197 }
1198 
si_init_hw_info(struct radeon_surface_manager * surf_man)1199 static int si_init_hw_info(struct radeon_surface_manager *surf_man)
1200 {
1201     uint32_t tiling_config;
1202     drmVersionPtr version;
1203     int r;
1204 
1205     r = radeon_get_value(surf_man->fd, RADEON_INFO_TILING_CONFIG,
1206                          &tiling_config);
1207     if (r) {
1208         return r;
1209     }
1210 
1211     surf_man->hw_info.allow_2d = 0;
1212     version = drmGetVersion(surf_man->fd);
1213     if (version && version->version_minor >= 33) {
1214         if (!radeon_get_value(surf_man->fd, RADEON_INFO_SI_TILE_MODE_ARRAY, surf_man->hw_info.tile_mode_array)) {
1215             surf_man->hw_info.allow_2d = 1;
1216         }
1217     }
1218     drmFreeVersion(version);
1219 
1220     switch (tiling_config & 0xf) {
1221     case 0:
1222         surf_man->hw_info.num_pipes = 1;
1223         break;
1224     case 1:
1225         surf_man->hw_info.num_pipes = 2;
1226         break;
1227     case 2:
1228         surf_man->hw_info.num_pipes = 4;
1229         break;
1230     case 3:
1231         surf_man->hw_info.num_pipes = 8;
1232         break;
1233     default:
1234         surf_man->hw_info.num_pipes = 8;
1235         surf_man->hw_info.allow_2d = 0;
1236         break;
1237     }
1238 
1239     switch ((tiling_config & 0xf0) >> 4) {
1240     case 0:
1241         surf_man->hw_info.num_banks = 4;
1242         break;
1243     case 1:
1244         surf_man->hw_info.num_banks = 8;
1245         break;
1246     case 2:
1247         surf_man->hw_info.num_banks = 16;
1248         break;
1249     default:
1250         surf_man->hw_info.num_banks = 8;
1251         surf_man->hw_info.allow_2d = 0;
1252         break;
1253     }
1254 
1255     switch ((tiling_config & 0xf00) >> 8) {
1256     case 0:
1257         surf_man->hw_info.group_bytes = 256;
1258         break;
1259     case 1:
1260         surf_man->hw_info.group_bytes = 512;
1261         break;
1262     default:
1263         surf_man->hw_info.group_bytes = 256;
1264         surf_man->hw_info.allow_2d = 0;
1265         break;
1266     }
1267 
1268     switch ((tiling_config & 0xf000) >> 12) {
1269     case 0:
1270         surf_man->hw_info.row_size = 1024;
1271         break;
1272     case 1:
1273         surf_man->hw_info.row_size = 2048;
1274         break;
1275     case 2:
1276         surf_man->hw_info.row_size = 4096;
1277         break;
1278     default:
1279         surf_man->hw_info.row_size = 4096;
1280         surf_man->hw_info.allow_2d = 0;
1281         break;
1282     }
1283     return 0;
1284 }
1285 
si_surface_sanity(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,unsigned mode,unsigned * tile_mode,unsigned * stencil_tile_mode)1286 static int si_surface_sanity(struct radeon_surface_manager *surf_man,
1287                              struct radeon_surface *surf,
1288                              unsigned mode, unsigned *tile_mode, unsigned *stencil_tile_mode)
1289 {
1290     uint32_t gb_tile_mode;
1291 
1292     /* check surface dimension */
1293     if (surf->npix_x > 16384 || surf->npix_y > 16384 || surf->npix_z > 16384) {
1294         return -EINVAL;
1295     }
1296 
1297     /* check mipmap last_level */
1298     if (surf->last_level > 15) {
1299         return -EINVAL;
1300     }
1301 
1302     /* force 1d on kernel that can't do 2d */
1303     if (mode > RADEON_SURF_MODE_1D &&
1304         (!surf_man->hw_info.allow_2d || !(surf->flags & RADEON_SURF_HAS_TILE_MODE_INDEX))) {
1305         if (surf->nsamples > 1) {
1306             fprintf(stderr, "radeon: Cannot use 1D tiling for an MSAA surface (%i).\n", __LINE__);
1307             return -EFAULT;
1308         }
1309         mode = RADEON_SURF_MODE_1D;
1310         surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
1311         surf->flags |= RADEON_SURF_SET(mode, MODE);
1312     }
1313 
1314     if (surf->nsamples > 1 && mode != RADEON_SURF_MODE_2D) {
1315         return -EINVAL;
1316     }
1317 
1318     if (!surf->tile_split) {
1319         /* default value */
1320         surf->mtilea = 1;
1321         surf->bankw = 1;
1322         surf->bankh = 1;
1323         surf->tile_split = 64;
1324         surf->stencil_tile_split = 64;
1325     }
1326 
1327     switch (mode) {
1328     case RADEON_SURF_MODE_2D:
1329         if (surf->flags & RADEON_SURF_SBUFFER) {
1330             switch (surf->nsamples) {
1331             case 1:
1332                 *stencil_tile_mode = SI_TILE_MODE_DEPTH_STENCIL_2D;
1333                 break;
1334             case 2:
1335                 *stencil_tile_mode = SI_TILE_MODE_DEPTH_STENCIL_2D_2AA;
1336                 break;
1337             case 4:
1338                 *stencil_tile_mode = SI_TILE_MODE_DEPTH_STENCIL_2D_4AA;
1339                 break;
1340             case 8:
1341                 *stencil_tile_mode = SI_TILE_MODE_DEPTH_STENCIL_2D_8AA;
1342                 break;
1343             default:
1344                 return -EINVAL;
1345             }
1346             /* retrieve tiling mode value */
1347             gb_tile_mode = surf_man->hw_info.tile_mode_array[*stencil_tile_mode];
1348             si_gb_tile_mode(gb_tile_mode, NULL, NULL, NULL, NULL, NULL, &surf->stencil_tile_split);
1349         }
1350         if (surf->flags & RADEON_SURF_ZBUFFER) {
1351             switch (surf->nsamples) {
1352             case 1:
1353                 *tile_mode = SI_TILE_MODE_DEPTH_STENCIL_2D;
1354                 break;
1355             case 2:
1356                 *tile_mode = SI_TILE_MODE_DEPTH_STENCIL_2D_2AA;
1357                 break;
1358             case 4:
1359                 *tile_mode = SI_TILE_MODE_DEPTH_STENCIL_2D_4AA;
1360                 break;
1361             case 8:
1362                 *tile_mode = SI_TILE_MODE_DEPTH_STENCIL_2D_8AA;
1363                 break;
1364             default:
1365                 return -EINVAL;
1366             }
1367         } else if (surf->flags & RADEON_SURF_SCANOUT) {
1368             switch (surf->bpe) {
1369             case 2:
1370                 *tile_mode = SI_TILE_MODE_COLOR_2D_SCANOUT_16BPP;
1371                 break;
1372             case 4:
1373                 *tile_mode = SI_TILE_MODE_COLOR_2D_SCANOUT_32BPP;
1374                 break;
1375             default:
1376                 return -EINVAL;
1377             }
1378         } else {
1379             switch (surf->bpe) {
1380             case 1:
1381                 *tile_mode = SI_TILE_MODE_COLOR_2D_8BPP;
1382                 break;
1383             case 2:
1384                 *tile_mode = SI_TILE_MODE_COLOR_2D_16BPP;
1385                 break;
1386             case 4:
1387                 *tile_mode = SI_TILE_MODE_COLOR_2D_32BPP;
1388                 break;
1389             case 8:
1390             case 16:
1391                 *tile_mode = SI_TILE_MODE_COLOR_2D_64BPP;
1392                 break;
1393             default:
1394                 return -EINVAL;
1395             }
1396         }
1397         /* retrieve tiling mode value */
1398         gb_tile_mode = surf_man->hw_info.tile_mode_array[*tile_mode];
1399         si_gb_tile_mode(gb_tile_mode, NULL, NULL, &surf->mtilea, &surf->bankw, &surf->bankh, &surf->tile_split);
1400         break;
1401     case RADEON_SURF_MODE_1D:
1402         if (surf->flags & RADEON_SURF_SBUFFER) {
1403             *stencil_tile_mode = SI_TILE_MODE_DEPTH_STENCIL_1D;
1404         }
1405         if (surf->flags & RADEON_SURF_ZBUFFER) {
1406             *tile_mode = SI_TILE_MODE_DEPTH_STENCIL_1D;
1407         } else if (surf->flags & RADEON_SURF_SCANOUT) {
1408             *tile_mode = SI_TILE_MODE_COLOR_1D_SCANOUT;
1409         } else {
1410             *tile_mode = SI_TILE_MODE_COLOR_1D;
1411         }
1412         break;
1413     case RADEON_SURF_MODE_LINEAR_ALIGNED:
1414     default:
1415         *tile_mode = SI_TILE_MODE_COLOR_LINEAR_ALIGNED;
1416     }
1417 
1418     return 0;
1419 }
1420 
si_surf_minify(struct radeon_surface * surf,struct radeon_surface_level * surflevel,unsigned bpe,unsigned level,uint32_t xalign,uint32_t yalign,uint32_t zalign,uint32_t slice_align,uint64_t offset)1421 static void si_surf_minify(struct radeon_surface *surf,
1422                            struct radeon_surface_level *surflevel,
1423                            unsigned bpe, unsigned level,
1424                            uint32_t xalign, uint32_t yalign, uint32_t zalign,
1425                            uint32_t slice_align, uint64_t offset)
1426 {
1427     if (level == 0) {
1428         surflevel->npix_x = surf->npix_x;
1429     } else {
1430         surflevel->npix_x = mip_minify(next_power_of_two(surf->npix_x), level);
1431     }
1432     surflevel->npix_y = mip_minify(surf->npix_y, level);
1433     surflevel->npix_z = mip_minify(surf->npix_z, level);
1434 
1435     if (level == 0 && surf->last_level > 0) {
1436         surflevel->nblk_x = (next_power_of_two(surflevel->npix_x) + surf->blk_w - 1) / surf->blk_w;
1437         surflevel->nblk_y = (next_power_of_two(surflevel->npix_y) + surf->blk_h - 1) / surf->blk_h;
1438         surflevel->nblk_z = (next_power_of_two(surflevel->npix_z) + surf->blk_d - 1) / surf->blk_d;
1439     } else {
1440         surflevel->nblk_x = (surflevel->npix_x + surf->blk_w - 1) / surf->blk_w;
1441         surflevel->nblk_y = (surflevel->npix_y + surf->blk_h - 1) / surf->blk_h;
1442         surflevel->nblk_z = (surflevel->npix_z + surf->blk_d - 1) / surf->blk_d;
1443     }
1444 
1445     surflevel->nblk_y  = ALIGN(surflevel->nblk_y, yalign);
1446 
1447     /* XXX: Texture sampling uses unexpectedly large pitches in some cases,
1448      * these are just guesses for the rules behind those
1449      */
1450     if (level == 0 && surf->last_level == 0)
1451         /* Non-mipmap pitch padded to slice alignment */
1452         /* Using just bpe here breaks stencil blitting; surf->bpe works. */
1453         xalign = MAX2(xalign, slice_align / surf->bpe);
1454     else if (surflevel->mode == RADEON_SURF_MODE_LINEAR_ALIGNED)
1455         /* Small rows evenly distributed across slice */
1456         xalign = MAX2(xalign, slice_align / bpe / surflevel->nblk_y);
1457 
1458     surflevel->nblk_x  = ALIGN(surflevel->nblk_x, xalign);
1459     surflevel->nblk_z  = ALIGN(surflevel->nblk_z, zalign);
1460 
1461     surflevel->offset = offset;
1462     surflevel->pitch_bytes = surflevel->nblk_x * bpe * surf->nsamples;
1463     surflevel->slice_size = ALIGN((uint64_t)surflevel->pitch_bytes * surflevel->nblk_y,
1464 				  (uint64_t)slice_align);
1465 
1466     surf->bo_size = offset + surflevel->slice_size * surflevel->nblk_z * surf->array_size;
1467 }
1468 
si_surf_minify_2d(struct radeon_surface * surf,struct radeon_surface_level * surflevel,unsigned bpe,unsigned level,unsigned slice_pt,uint32_t xalign,uint32_t yalign,uint32_t zalign,unsigned mtileb,uint64_t offset)1469 static void si_surf_minify_2d(struct radeon_surface *surf,
1470                               struct radeon_surface_level *surflevel,
1471                               unsigned bpe, unsigned level, unsigned slice_pt,
1472                               uint32_t xalign, uint32_t yalign, uint32_t zalign,
1473                               unsigned mtileb, uint64_t offset)
1474 {
1475     unsigned mtile_pr, mtile_ps;
1476 
1477     if (level == 0) {
1478         surflevel->npix_x = surf->npix_x;
1479     } else {
1480         surflevel->npix_x = mip_minify(next_power_of_two(surf->npix_x), level);
1481     }
1482     surflevel->npix_y = mip_minify(surf->npix_y, level);
1483     surflevel->npix_z = mip_minify(surf->npix_z, level);
1484 
1485     if (level == 0 && surf->last_level > 0) {
1486         surflevel->nblk_x = (next_power_of_two(surflevel->npix_x) + surf->blk_w - 1) / surf->blk_w;
1487         surflevel->nblk_y = (next_power_of_two(surflevel->npix_y) + surf->blk_h - 1) / surf->blk_h;
1488         surflevel->nblk_z = (next_power_of_two(surflevel->npix_z) + surf->blk_d - 1) / surf->blk_d;
1489     } else {
1490         surflevel->nblk_x = (surflevel->npix_x + surf->blk_w - 1) / surf->blk_w;
1491         surflevel->nblk_y = (surflevel->npix_y + surf->blk_h - 1) / surf->blk_h;
1492         surflevel->nblk_z = (surflevel->npix_z + surf->blk_d - 1) / surf->blk_d;
1493     }
1494 
1495     if (surf->nsamples == 1 && surflevel->mode == RADEON_SURF_MODE_2D &&
1496         !(surf->flags & RADEON_SURF_FMASK)) {
1497         if (surflevel->nblk_x < xalign || surflevel->nblk_y < yalign) {
1498             surflevel->mode = RADEON_SURF_MODE_1D;
1499             return;
1500         }
1501     }
1502     surflevel->nblk_x  = ALIGN(surflevel->nblk_x, xalign);
1503     surflevel->nblk_y  = ALIGN(surflevel->nblk_y, yalign);
1504     surflevel->nblk_z  = ALIGN(surflevel->nblk_z, zalign);
1505 
1506     /* macro tile per row */
1507     mtile_pr = surflevel->nblk_x / xalign;
1508     /* macro tile per slice */
1509     mtile_ps = (mtile_pr * surflevel->nblk_y) / yalign;
1510     surflevel->offset = offset;
1511     surflevel->pitch_bytes = surflevel->nblk_x * bpe * surf->nsamples;
1512     surflevel->slice_size = (uint64_t)mtile_ps * mtileb * slice_pt;
1513 
1514     surf->bo_size = offset + surflevel->slice_size * surflevel->nblk_z * surf->array_size;
1515 }
1516 
si_surface_init_linear_aligned(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,unsigned tile_mode,uint64_t offset,unsigned start_level)1517 static int si_surface_init_linear_aligned(struct radeon_surface_manager *surf_man,
1518                                           struct radeon_surface *surf,
1519                                           unsigned tile_mode,
1520                                           uint64_t offset, unsigned start_level)
1521 {
1522     uint32_t xalign, yalign, zalign, slice_align;
1523     unsigned i;
1524 
1525     /* compute alignment */
1526     if (!start_level) {
1527         surf->bo_alignment = MAX2(256, surf_man->hw_info.group_bytes);
1528     }
1529     xalign = MAX2(8, 64 / surf->bpe);
1530     yalign = 1;
1531     zalign = 1;
1532     slice_align = MAX2(64 * surf->bpe, surf_man->hw_info.group_bytes);
1533 
1534     /* build mipmap tree */
1535     for (i = start_level; i <= surf->last_level; i++) {
1536         surf->level[i].mode = RADEON_SURF_MODE_LINEAR_ALIGNED;
1537         si_surf_minify(surf, surf->level+i, surf->bpe, i, xalign, yalign, zalign, slice_align, offset);
1538         /* level0 and first mipmap need to have alignment */
1539         offset = surf->bo_size;
1540         if (i == 0) {
1541             offset = ALIGN(offset, surf->bo_alignment);
1542         }
1543         if (surf->flags & RADEON_SURF_HAS_TILE_MODE_INDEX) {
1544             surf->tiling_index[i] = tile_mode;
1545         }
1546     }
1547     return 0;
1548 }
1549 
si_surface_init_1d(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,struct radeon_surface_level * level,unsigned bpe,unsigned tile_mode,uint64_t offset,unsigned start_level)1550 static int si_surface_init_1d(struct radeon_surface_manager *surf_man,
1551                               struct radeon_surface *surf,
1552                               struct radeon_surface_level *level,
1553                               unsigned bpe, unsigned tile_mode,
1554                               uint64_t offset, unsigned start_level)
1555 {
1556     uint32_t xalign, yalign, zalign, slice_align;
1557     unsigned alignment = MAX2(256, surf_man->hw_info.group_bytes);
1558     unsigned i;
1559 
1560     /* compute alignment */
1561     xalign = 8;
1562     yalign = 8;
1563     zalign = 1;
1564     slice_align = surf_man->hw_info.group_bytes;
1565     if (surf->flags & RADEON_SURF_SCANOUT) {
1566         xalign = MAX2((bpe == 1) ? 64 : 32, xalign);
1567     }
1568 
1569     if (start_level <= 1) {
1570         surf->bo_alignment = MAX2(surf->bo_alignment, alignment);
1571 
1572         if (offset) {
1573             offset = ALIGN(offset, alignment);
1574         }
1575     }
1576 
1577     /* build mipmap tree */
1578     for (i = start_level; i <= surf->last_level; i++) {
1579         level[i].mode = RADEON_SURF_MODE_1D;
1580         si_surf_minify(surf, level+i, bpe, i, xalign, yalign, zalign, slice_align, offset);
1581         /* level0 and first mipmap need to have alignment */
1582         offset = surf->bo_size;
1583         if (i == 0) {
1584             offset = ALIGN(offset, alignment);
1585         }
1586         if (surf->flags & RADEON_SURF_HAS_TILE_MODE_INDEX) {
1587             if (surf->level == level) {
1588                 surf->tiling_index[i] = tile_mode;
1589                 /* it's ok because stencil is done after */
1590                 surf->stencil_tiling_index[i] = tile_mode;
1591             } else {
1592                 surf->stencil_tiling_index[i] = tile_mode;
1593             }
1594         }
1595     }
1596     return 0;
1597 }
1598 
si_surface_init_1d_miptrees(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,unsigned tile_mode,unsigned stencil_tile_mode)1599 static int si_surface_init_1d_miptrees(struct radeon_surface_manager *surf_man,
1600                                        struct radeon_surface *surf,
1601                                        unsigned tile_mode, unsigned stencil_tile_mode)
1602 {
1603     int r;
1604 
1605     r = si_surface_init_1d(surf_man, surf, surf->level, surf->bpe, tile_mode, 0, 0);
1606     if (r) {
1607         return r;
1608     }
1609 
1610     if (surf->flags & RADEON_SURF_SBUFFER) {
1611         r = si_surface_init_1d(surf_man, surf, surf->stencil_level, 1, stencil_tile_mode, surf->bo_size, 0);
1612         surf->stencil_offset = surf->stencil_level[0].offset;
1613     }
1614     return r;
1615 }
1616 
si_surface_init_2d(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,struct radeon_surface_level * level,unsigned bpe,unsigned tile_mode,unsigned num_pipes,unsigned num_banks,unsigned tile_split,uint64_t offset,unsigned start_level)1617 static int si_surface_init_2d(struct radeon_surface_manager *surf_man,
1618                               struct radeon_surface *surf,
1619                               struct radeon_surface_level *level,
1620                               unsigned bpe, unsigned tile_mode,
1621                               unsigned num_pipes, unsigned num_banks,
1622                               unsigned tile_split,
1623                               uint64_t offset,
1624                               unsigned start_level)
1625 {
1626     uint64_t aligned_offset = offset;
1627     unsigned tilew, tileh, tileb;
1628     unsigned mtilew, mtileh, mtileb;
1629     unsigned slice_pt;
1630     unsigned i;
1631 
1632     /* compute tile values */
1633     tilew = 8;
1634     tileh = 8;
1635     tileb = tilew * tileh * bpe * surf->nsamples;
1636     /* slices per tile */
1637     slice_pt = 1;
1638     if (tileb > tile_split && tile_split) {
1639         slice_pt = tileb / tile_split;
1640     }
1641     tileb = tileb / slice_pt;
1642 
1643     /* macro tile width & height */
1644     mtilew = (tilew * surf->bankw * num_pipes) * surf->mtilea;
1645     mtileh = (tileh * surf->bankh * num_banks) / surf->mtilea;
1646 
1647     /* macro tile bytes */
1648     mtileb = (mtilew / tilew) * (mtileh / tileh) * tileb;
1649 
1650     if (start_level <= 1) {
1651         unsigned alignment = MAX2(256, mtileb);
1652         surf->bo_alignment = MAX2(surf->bo_alignment, alignment);
1653 
1654         if (aligned_offset) {
1655             aligned_offset = ALIGN(aligned_offset, alignment);
1656         }
1657     }
1658 
1659     /* build mipmap tree */
1660     for (i = start_level; i <= surf->last_level; i++) {
1661         level[i].mode = RADEON_SURF_MODE_2D;
1662         si_surf_minify_2d(surf, level+i, bpe, i, slice_pt, mtilew, mtileh, 1, mtileb, aligned_offset);
1663         if (level[i].mode == RADEON_SURF_MODE_1D) {
1664             switch (tile_mode) {
1665             case SI_TILE_MODE_COLOR_2D_8BPP:
1666             case SI_TILE_MODE_COLOR_2D_16BPP:
1667             case SI_TILE_MODE_COLOR_2D_32BPP:
1668             case SI_TILE_MODE_COLOR_2D_64BPP:
1669                 tile_mode = SI_TILE_MODE_COLOR_1D;
1670                 break;
1671             case SI_TILE_MODE_COLOR_2D_SCANOUT_16BPP:
1672             case SI_TILE_MODE_COLOR_2D_SCANOUT_32BPP:
1673                 tile_mode = SI_TILE_MODE_COLOR_1D_SCANOUT;
1674                 break;
1675             case SI_TILE_MODE_DEPTH_STENCIL_2D:
1676                 tile_mode = SI_TILE_MODE_DEPTH_STENCIL_1D;
1677                 break;
1678             default:
1679                 return -EINVAL;
1680             }
1681             return si_surface_init_1d(surf_man, surf, level, bpe, tile_mode, offset, i);
1682         }
1683         /* level0 and first mipmap need to have alignment */
1684         aligned_offset = offset = surf->bo_size;
1685         if (i == 0) {
1686             aligned_offset = ALIGN(aligned_offset, surf->bo_alignment);
1687         }
1688         if (surf->flags & RADEON_SURF_HAS_TILE_MODE_INDEX) {
1689             if (surf->level == level) {
1690                 surf->tiling_index[i] = tile_mode;
1691                 /* it's ok because stencil is done after */
1692                 surf->stencil_tiling_index[i] = tile_mode;
1693             } else {
1694                 surf->stencil_tiling_index[i] = tile_mode;
1695             }
1696         }
1697     }
1698     return 0;
1699 }
1700 
si_surface_init_2d_miptrees(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,unsigned tile_mode,unsigned stencil_tile_mode)1701 static int si_surface_init_2d_miptrees(struct radeon_surface_manager *surf_man,
1702                                        struct radeon_surface *surf,
1703                                        unsigned tile_mode, unsigned stencil_tile_mode)
1704 {
1705     unsigned num_pipes, num_banks;
1706     uint32_t gb_tile_mode;
1707     int r;
1708 
1709     /* retrieve tiling mode value */
1710     gb_tile_mode = surf_man->hw_info.tile_mode_array[tile_mode];
1711     si_gb_tile_mode(gb_tile_mode, &num_pipes, &num_banks, NULL, NULL, NULL, NULL);
1712 
1713     r = si_surface_init_2d(surf_man, surf, surf->level, surf->bpe, tile_mode, num_pipes, num_banks, surf->tile_split, 0, 0);
1714     if (r) {
1715         return r;
1716     }
1717 
1718     if (surf->flags & RADEON_SURF_SBUFFER) {
1719         r = si_surface_init_2d(surf_man, surf, surf->stencil_level, 1, stencil_tile_mode, num_pipes, num_banks, surf->stencil_tile_split, surf->bo_size, 0);
1720         surf->stencil_offset = surf->stencil_level[0].offset;
1721     }
1722     return r;
1723 }
1724 
si_surface_init(struct radeon_surface_manager * surf_man,struct radeon_surface * surf)1725 static int si_surface_init(struct radeon_surface_manager *surf_man,
1726                            struct radeon_surface *surf)
1727 {
1728     unsigned mode, tile_mode, stencil_tile_mode;
1729     int r;
1730 
1731     /* MSAA surfaces support the 2D mode only. */
1732     if (surf->nsamples > 1) {
1733         surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
1734         surf->flags |= RADEON_SURF_SET(RADEON_SURF_MODE_2D, MODE);
1735     }
1736 
1737     /* tiling mode */
1738     mode = (surf->flags >> RADEON_SURF_MODE_SHIFT) & RADEON_SURF_MODE_MASK;
1739 
1740     if (surf->flags & (RADEON_SURF_ZBUFFER | RADEON_SURF_SBUFFER)) {
1741         /* zbuffer only support 1D or 2D tiled surface */
1742         switch (mode) {
1743         case RADEON_SURF_MODE_1D:
1744         case RADEON_SURF_MODE_2D:
1745             break;
1746         default:
1747             mode = RADEON_SURF_MODE_1D;
1748             surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
1749             surf->flags |= RADEON_SURF_SET(RADEON_SURF_MODE_1D, MODE);
1750             break;
1751         }
1752     }
1753 
1754     r = si_surface_sanity(surf_man, surf, mode, &tile_mode, &stencil_tile_mode);
1755     if (r) {
1756         return r;
1757     }
1758 
1759     surf->stencil_offset = 0;
1760     surf->bo_alignment = 0;
1761 
1762     /* check tiling mode */
1763     switch (mode) {
1764     case RADEON_SURF_MODE_LINEAR:
1765         r = r6_surface_init_linear(surf_man, surf, 0, 0);
1766         break;
1767     case RADEON_SURF_MODE_LINEAR_ALIGNED:
1768         r = si_surface_init_linear_aligned(surf_man, surf, tile_mode, 0, 0);
1769         break;
1770     case RADEON_SURF_MODE_1D:
1771         r = si_surface_init_1d_miptrees(surf_man, surf, tile_mode, stencil_tile_mode);
1772         break;
1773     case RADEON_SURF_MODE_2D:
1774         r = si_surface_init_2d_miptrees(surf_man, surf, tile_mode, stencil_tile_mode);
1775         break;
1776     default:
1777         return -EINVAL;
1778     }
1779     return r;
1780 }
1781 
1782 /*
1783  * depending on surface
1784  */
si_surface_best(struct radeon_surface_manager * surf_man,struct radeon_surface * surf)1785 static int si_surface_best(struct radeon_surface_manager *surf_man,
1786                            struct radeon_surface *surf)
1787 {
1788     unsigned mode, tile_mode, stencil_tile_mode;
1789 
1790     /* tiling mode */
1791     mode = (surf->flags >> RADEON_SURF_MODE_SHIFT) & RADEON_SURF_MODE_MASK;
1792 
1793     if (surf->flags & (RADEON_SURF_ZBUFFER | RADEON_SURF_SBUFFER) &&
1794         !(surf->flags & RADEON_SURF_HAS_TILE_MODE_INDEX)) {
1795         /* depth/stencil force 1d tiling for old mesa */
1796         surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
1797         surf->flags |= RADEON_SURF_SET(RADEON_SURF_MODE_1D, MODE);
1798     }
1799 
1800     return si_surface_sanity(surf_man, surf, mode, &tile_mode, &stencil_tile_mode);
1801 }
1802 
1803 
1804 /* ===========================================================================
1805  * Sea Islands family
1806  */
1807 #define CIK__GB_TILE_MODE__PIPE_CONFIG(x)        (((x) >> 6) & 0x1f)
1808 #define     CIK__PIPE_CONFIG__ADDR_SURF_P2               0
1809 #define     CIK__PIPE_CONFIG__ADDR_SURF_P4_8x16          4
1810 #define     CIK__PIPE_CONFIG__ADDR_SURF_P4_16x16         5
1811 #define     CIK__PIPE_CONFIG__ADDR_SURF_P4_16x32         6
1812 #define     CIK__PIPE_CONFIG__ADDR_SURF_P4_32x32         7
1813 #define     CIK__PIPE_CONFIG__ADDR_SURF_P8_16x16_8x16    8
1814 #define     CIK__PIPE_CONFIG__ADDR_SURF_P8_16x32_8x16    9
1815 #define     CIK__PIPE_CONFIG__ADDR_SURF_P8_32x32_8x16    10
1816 #define     CIK__PIPE_CONFIG__ADDR_SURF_P8_16x32_16x16   11
1817 #define     CIK__PIPE_CONFIG__ADDR_SURF_P8_32x32_16x16   12
1818 #define     CIK__PIPE_CONFIG__ADDR_SURF_P8_32x32_16x32   13
1819 #define     CIK__PIPE_CONFIG__ADDR_SURF_P8_32x64_32x32   14
1820 #define     CIK__PIPE_CONFIG__ADDR_SURF_P16_32X32_8X16   16
1821 #define     CIK__PIPE_CONFIG__ADDR_SURF_P16_32X32_16X16  17
1822 #define CIK__GB_TILE_MODE__TILE_SPLIT(x)         (((x) >> 11) & 0x7)
1823 #define     CIK__TILE_SPLIT__64B                         0
1824 #define     CIK__TILE_SPLIT__128B                        1
1825 #define     CIK__TILE_SPLIT__256B                        2
1826 #define     CIK__TILE_SPLIT__512B                        3
1827 #define     CIK__TILE_SPLIT__1024B                       4
1828 #define     CIK__TILE_SPLIT__2048B                       5
1829 #define     CIK__TILE_SPLIT__4096B                       6
1830 #define CIK__GB_TILE_MODE__SAMPLE_SPLIT(x)         (((x) >> 25) & 0x3)
1831 #define     CIK__SAMPLE_SPLIT__1                         0
1832 #define     CIK__SAMPLE_SPLIT__2                         1
1833 #define     CIK__SAMPLE_SPLIT__4                         2
1834 #define     CIK__SAMPLE_SPLIT__8                         3
1835 #define CIK__GB_MACROTILE_MODE__BANK_WIDTH(x)        ((x) & 0x3)
1836 #define     CIK__BANK_WIDTH__1                           0
1837 #define     CIK__BANK_WIDTH__2                           1
1838 #define     CIK__BANK_WIDTH__4                           2
1839 #define     CIK__BANK_WIDTH__8                           3
1840 #define CIK__GB_MACROTILE_MODE__BANK_HEIGHT(x)       (((x) >> 2) & 0x3)
1841 #define     CIK__BANK_HEIGHT__1                          0
1842 #define     CIK__BANK_HEIGHT__2                          1
1843 #define     CIK__BANK_HEIGHT__4                          2
1844 #define     CIK__BANK_HEIGHT__8                          3
1845 #define CIK__GB_MACROTILE_MODE__MACRO_TILE_ASPECT(x) (((x) >> 4) & 0x3)
1846 #define     CIK__MACRO_TILE_ASPECT__1                    0
1847 #define     CIK__MACRO_TILE_ASPECT__2                    1
1848 #define     CIK__MACRO_TILE_ASPECT__4                    2
1849 #define     CIK__MACRO_TILE_ASPECT__8                    3
1850 #define CIK__GB_MACROTILE_MODE__NUM_BANKS(x)         (((x) >> 6) & 0x3)
1851 #define     CIK__NUM_BANKS__2_BANK                       0
1852 #define     CIK__NUM_BANKS__4_BANK                       1
1853 #define     CIK__NUM_BANKS__8_BANK                       2
1854 #define     CIK__NUM_BANKS__16_BANK                      3
1855 
1856 
cik_get_2d_params(struct radeon_surface_manager * surf_man,unsigned bpe,unsigned nsamples,bool is_color,unsigned tile_mode,uint32_t * num_pipes,uint32_t * tile_split_ptr,uint32_t * num_banks,uint32_t * macro_tile_aspect,uint32_t * bank_w,uint32_t * bank_h)1857 static void cik_get_2d_params(struct radeon_surface_manager *surf_man,
1858                               unsigned bpe, unsigned nsamples, bool is_color,
1859                               unsigned tile_mode,
1860                               uint32_t *num_pipes,
1861                               uint32_t *tile_split_ptr,
1862                               uint32_t *num_banks,
1863                               uint32_t *macro_tile_aspect,
1864                               uint32_t *bank_w,
1865                               uint32_t *bank_h)
1866 {
1867     uint32_t gb_tile_mode = surf_man->hw_info.tile_mode_array[tile_mode];
1868     unsigned tileb_1x, tileb;
1869     unsigned gb_macrotile_mode;
1870     unsigned macrotile_index;
1871     unsigned tile_split, sample_split;
1872 
1873     if (num_pipes) {
1874         switch (CIK__GB_TILE_MODE__PIPE_CONFIG(gb_tile_mode)) {
1875         case CIK__PIPE_CONFIG__ADDR_SURF_P2:
1876         default:
1877             *num_pipes = 2;
1878             break;
1879         case CIK__PIPE_CONFIG__ADDR_SURF_P4_8x16:
1880         case CIK__PIPE_CONFIG__ADDR_SURF_P4_16x16:
1881         case CIK__PIPE_CONFIG__ADDR_SURF_P4_16x32:
1882         case CIK__PIPE_CONFIG__ADDR_SURF_P4_32x32:
1883             *num_pipes = 4;
1884             break;
1885         case CIK__PIPE_CONFIG__ADDR_SURF_P8_16x16_8x16:
1886         case CIK__PIPE_CONFIG__ADDR_SURF_P8_16x32_8x16:
1887         case CIK__PIPE_CONFIG__ADDR_SURF_P8_32x32_8x16:
1888         case CIK__PIPE_CONFIG__ADDR_SURF_P8_16x32_16x16:
1889         case CIK__PIPE_CONFIG__ADDR_SURF_P8_32x32_16x16:
1890         case CIK__PIPE_CONFIG__ADDR_SURF_P8_32x32_16x32:
1891         case CIK__PIPE_CONFIG__ADDR_SURF_P8_32x64_32x32:
1892             *num_pipes = 8;
1893             break;
1894         case CIK__PIPE_CONFIG__ADDR_SURF_P16_32X32_8X16:
1895         case CIK__PIPE_CONFIG__ADDR_SURF_P16_32X32_16X16:
1896             *num_pipes = 16;
1897             break;
1898         }
1899     }
1900     switch (CIK__GB_TILE_MODE__TILE_SPLIT(gb_tile_mode)) {
1901     default:
1902     case CIK__TILE_SPLIT__64B:
1903         tile_split = 64;
1904         break;
1905     case CIK__TILE_SPLIT__128B:
1906         tile_split = 128;
1907         break;
1908     case CIK__TILE_SPLIT__256B:
1909         tile_split = 256;
1910         break;
1911     case CIK__TILE_SPLIT__512B:
1912         tile_split = 512;
1913         break;
1914     case CIK__TILE_SPLIT__1024B:
1915         tile_split = 1024;
1916         break;
1917     case CIK__TILE_SPLIT__2048B:
1918         tile_split = 2048;
1919         break;
1920     case CIK__TILE_SPLIT__4096B:
1921         tile_split = 4096;
1922         break;
1923     }
1924     switch (CIK__GB_TILE_MODE__SAMPLE_SPLIT(gb_tile_mode)) {
1925     default:
1926     case CIK__SAMPLE_SPLIT__1:
1927         sample_split = 1;
1928         break;
1929     case CIK__SAMPLE_SPLIT__2:
1930         sample_split = 2;
1931         break;
1932     case CIK__SAMPLE_SPLIT__4:
1933         sample_split = 4;
1934         break;
1935     case CIK__SAMPLE_SPLIT__8:
1936         sample_split = 8;
1937         break;
1938     }
1939 
1940     /* Adjust the tile split. */
1941     tileb_1x = 8 * 8 * bpe;
1942     if (is_color) {
1943         tile_split = MAX2(256, sample_split * tileb_1x);
1944     }
1945     tile_split = MIN2(surf_man->hw_info.row_size, tile_split);
1946 
1947     /* Determine the macrotile index. */
1948     tileb = MIN2(tile_split, nsamples * tileb_1x);
1949 
1950     for (macrotile_index = 0; tileb > 64; macrotile_index++) {
1951         tileb >>= 1;
1952     }
1953     gb_macrotile_mode = surf_man->hw_info.macrotile_mode_array[macrotile_index];
1954 
1955     if (tile_split_ptr) {
1956         *tile_split_ptr = tile_split;
1957     }
1958     if (num_banks) {
1959         switch (CIK__GB_MACROTILE_MODE__NUM_BANKS(gb_macrotile_mode)) {
1960         default:
1961         case CIK__NUM_BANKS__2_BANK:
1962             *num_banks = 2;
1963             break;
1964         case CIK__NUM_BANKS__4_BANK:
1965             *num_banks = 4;
1966             break;
1967         case CIK__NUM_BANKS__8_BANK:
1968             *num_banks = 8;
1969             break;
1970         case CIK__NUM_BANKS__16_BANK:
1971             *num_banks = 16;
1972             break;
1973         }
1974     }
1975     if (macro_tile_aspect) {
1976         switch (CIK__GB_MACROTILE_MODE__MACRO_TILE_ASPECT(gb_macrotile_mode)) {
1977         default:
1978         case CIK__MACRO_TILE_ASPECT__1:
1979             *macro_tile_aspect = 1;
1980             break;
1981         case CIK__MACRO_TILE_ASPECT__2:
1982             *macro_tile_aspect = 2;
1983             break;
1984         case CIK__MACRO_TILE_ASPECT__4:
1985             *macro_tile_aspect = 4;
1986             break;
1987         case CIK__MACRO_TILE_ASPECT__8:
1988             *macro_tile_aspect = 8;
1989             break;
1990         }
1991     }
1992     if (bank_w) {
1993         switch (CIK__GB_MACROTILE_MODE__BANK_WIDTH(gb_macrotile_mode)) {
1994         default:
1995         case CIK__BANK_WIDTH__1:
1996             *bank_w = 1;
1997             break;
1998         case CIK__BANK_WIDTH__2:
1999             *bank_w = 2;
2000             break;
2001         case CIK__BANK_WIDTH__4:
2002             *bank_w = 4;
2003             break;
2004         case CIK__BANK_WIDTH__8:
2005             *bank_w = 8;
2006             break;
2007         }
2008     }
2009     if (bank_h) {
2010         switch (CIK__GB_MACROTILE_MODE__BANK_HEIGHT(gb_macrotile_mode)) {
2011         default:
2012         case CIK__BANK_HEIGHT__1:
2013             *bank_h = 1;
2014             break;
2015         case CIK__BANK_HEIGHT__2:
2016             *bank_h = 2;
2017             break;
2018         case CIK__BANK_HEIGHT__4:
2019             *bank_h = 4;
2020             break;
2021         case CIK__BANK_HEIGHT__8:
2022             *bank_h = 8;
2023             break;
2024         }
2025     }
2026 }
2027 
cik_init_hw_info(struct radeon_surface_manager * surf_man)2028 static int cik_init_hw_info(struct radeon_surface_manager *surf_man)
2029 {
2030     uint32_t tiling_config;
2031     drmVersionPtr version;
2032     int r;
2033 
2034     r = radeon_get_value(surf_man->fd, RADEON_INFO_TILING_CONFIG,
2035                          &tiling_config);
2036     if (r) {
2037         return r;
2038     }
2039 
2040     surf_man->hw_info.allow_2d = 0;
2041     version = drmGetVersion(surf_man->fd);
2042     if (version && version->version_minor >= 35) {
2043         if (!radeon_get_value(surf_man->fd, RADEON_INFO_SI_TILE_MODE_ARRAY, surf_man->hw_info.tile_mode_array) &&
2044 	    !radeon_get_value(surf_man->fd, RADEON_INFO_CIK_MACROTILE_MODE_ARRAY, surf_man->hw_info.macrotile_mode_array)) {
2045             surf_man->hw_info.allow_2d = 1;
2046         }
2047     }
2048     drmFreeVersion(version);
2049 
2050     switch (tiling_config & 0xf) {
2051     case 0:
2052         surf_man->hw_info.num_pipes = 1;
2053         break;
2054     case 1:
2055         surf_man->hw_info.num_pipes = 2;
2056         break;
2057     case 2:
2058         surf_man->hw_info.num_pipes = 4;
2059         break;
2060     case 3:
2061         surf_man->hw_info.num_pipes = 8;
2062         break;
2063     default:
2064         surf_man->hw_info.num_pipes = 8;
2065         surf_man->hw_info.allow_2d = 0;
2066         break;
2067     }
2068 
2069     switch ((tiling_config & 0xf0) >> 4) {
2070     case 0:
2071         surf_man->hw_info.num_banks = 4;
2072         break;
2073     case 1:
2074         surf_man->hw_info.num_banks = 8;
2075         break;
2076     case 2:
2077         surf_man->hw_info.num_banks = 16;
2078         break;
2079     default:
2080         surf_man->hw_info.num_banks = 8;
2081         surf_man->hw_info.allow_2d = 0;
2082         break;
2083     }
2084 
2085     switch ((tiling_config & 0xf00) >> 8) {
2086     case 0:
2087         surf_man->hw_info.group_bytes = 256;
2088         break;
2089     case 1:
2090         surf_man->hw_info.group_bytes = 512;
2091         break;
2092     default:
2093         surf_man->hw_info.group_bytes = 256;
2094         surf_man->hw_info.allow_2d = 0;
2095         break;
2096     }
2097 
2098     switch ((tiling_config & 0xf000) >> 12) {
2099     case 0:
2100         surf_man->hw_info.row_size = 1024;
2101         break;
2102     case 1:
2103         surf_man->hw_info.row_size = 2048;
2104         break;
2105     case 2:
2106         surf_man->hw_info.row_size = 4096;
2107         break;
2108     default:
2109         surf_man->hw_info.row_size = 4096;
2110         surf_man->hw_info.allow_2d = 0;
2111         break;
2112     }
2113     return 0;
2114 }
2115 
cik_surface_sanity(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,unsigned mode,unsigned * tile_mode,unsigned * stencil_tile_mode)2116 static int cik_surface_sanity(struct radeon_surface_manager *surf_man,
2117                               struct radeon_surface *surf,
2118                               unsigned mode, unsigned *tile_mode, unsigned *stencil_tile_mode)
2119 {
2120     /* check surface dimension */
2121     if (surf->npix_x > 16384 || surf->npix_y > 16384 || surf->npix_z > 16384) {
2122         return -EINVAL;
2123     }
2124 
2125     /* check mipmap last_level */
2126     if (surf->last_level > 15) {
2127         return -EINVAL;
2128     }
2129 
2130     /* force 1d on kernel that can't do 2d */
2131     if (mode > RADEON_SURF_MODE_1D &&
2132         (!surf_man->hw_info.allow_2d || !(surf->flags & RADEON_SURF_HAS_TILE_MODE_INDEX))) {
2133         if (surf->nsamples > 1) {
2134             fprintf(stderr, "radeon: Cannot use 1D tiling for an MSAA surface (%i).\n", __LINE__);
2135             return -EFAULT;
2136         }
2137         mode = RADEON_SURF_MODE_1D;
2138         surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
2139         surf->flags |= RADEON_SURF_SET(mode, MODE);
2140     }
2141 
2142     if (surf->nsamples > 1 && mode != RADEON_SURF_MODE_2D) {
2143         return -EINVAL;
2144     }
2145 
2146     if (!surf->tile_split) {
2147         /* default value */
2148         surf->mtilea = 1;
2149         surf->bankw = 1;
2150         surf->bankh = 1;
2151         surf->tile_split = 64;
2152         surf->stencil_tile_split = 64;
2153     }
2154 
2155     switch (mode) {
2156     case RADEON_SURF_MODE_2D: {
2157         if (surf->flags & RADEON_SURF_Z_OR_SBUFFER) {
2158             switch (surf->nsamples) {
2159             case 1:
2160                 *tile_mode = CIK_TILE_MODE_DEPTH_STENCIL_2D_TILESPLIT_64;
2161                 break;
2162             case 2:
2163             case 4:
2164                 *tile_mode = CIK_TILE_MODE_DEPTH_STENCIL_2D_TILESPLIT_128;
2165                 break;
2166             case 8:
2167                 *tile_mode = CIK_TILE_MODE_DEPTH_STENCIL_2D_TILESPLIT_256;
2168                 break;
2169             default:
2170                 return -EINVAL;
2171             }
2172 
2173             if (surf->flags & RADEON_SURF_SBUFFER) {
2174                 *stencil_tile_mode = *tile_mode;
2175 
2176                 cik_get_2d_params(surf_man, 1, surf->nsamples, false,
2177                                   *stencil_tile_mode, NULL,
2178                                   &surf->stencil_tile_split,
2179                                   NULL, NULL, NULL, NULL);
2180             }
2181         } else if (surf->flags & RADEON_SURF_SCANOUT) {
2182             *tile_mode = CIK_TILE_MODE_COLOR_2D_SCANOUT;
2183         } else {
2184             *tile_mode = CIK_TILE_MODE_COLOR_2D;
2185         }
2186 
2187         /* retrieve tiling mode values */
2188         cik_get_2d_params(surf_man, surf->bpe, surf->nsamples,
2189                           !(surf->flags & RADEON_SURF_Z_OR_SBUFFER), *tile_mode,
2190                           NULL, &surf->tile_split, NULL, &surf->mtilea,
2191                           &surf->bankw, &surf->bankh);
2192         break;
2193     }
2194     case RADEON_SURF_MODE_1D:
2195         if (surf->flags & RADEON_SURF_SBUFFER) {
2196             *stencil_tile_mode = CIK_TILE_MODE_DEPTH_STENCIL_1D;
2197         }
2198         if (surf->flags & RADEON_SURF_ZBUFFER) {
2199             *tile_mode = CIK_TILE_MODE_DEPTH_STENCIL_1D;
2200         } else if (surf->flags & RADEON_SURF_SCANOUT) {
2201             *tile_mode = SI_TILE_MODE_COLOR_1D_SCANOUT;
2202         } else {
2203             *tile_mode = SI_TILE_MODE_COLOR_1D;
2204         }
2205         break;
2206     case RADEON_SURF_MODE_LINEAR_ALIGNED:
2207     default:
2208         *tile_mode = SI_TILE_MODE_COLOR_LINEAR_ALIGNED;
2209     }
2210 
2211     return 0;
2212 }
2213 
cik_surface_init_2d(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,struct radeon_surface_level * level,unsigned bpe,unsigned tile_mode,unsigned tile_split,unsigned num_pipes,unsigned num_banks,uint64_t offset,unsigned start_level)2214 static int cik_surface_init_2d(struct radeon_surface_manager *surf_man,
2215                                struct radeon_surface *surf,
2216                                struct radeon_surface_level *level,
2217                                unsigned bpe, unsigned tile_mode,
2218                                unsigned tile_split,
2219                                unsigned num_pipes, unsigned num_banks,
2220                                uint64_t offset,
2221                                unsigned start_level)
2222 {
2223     uint64_t aligned_offset = offset;
2224     unsigned tilew, tileh, tileb_1x, tileb;
2225     unsigned mtilew, mtileh, mtileb;
2226     unsigned slice_pt;
2227     unsigned i;
2228 
2229     /* compute tile values */
2230     tilew = 8;
2231     tileh = 8;
2232     tileb_1x = tilew * tileh * bpe;
2233 
2234     tile_split = MIN2(surf_man->hw_info.row_size, tile_split);
2235 
2236     tileb = surf->nsamples * tileb_1x;
2237 
2238     /* slices per tile */
2239     slice_pt = 1;
2240     if (tileb > tile_split && tile_split) {
2241         slice_pt = tileb / tile_split;
2242         tileb = tileb / slice_pt;
2243     }
2244 
2245     /* macro tile width & height */
2246     mtilew = (tilew * surf->bankw * num_pipes) * surf->mtilea;
2247     mtileh = (tileh * surf->bankh * num_banks) / surf->mtilea;
2248 
2249     /* macro tile bytes */
2250     mtileb = (mtilew / tilew) * (mtileh / tileh) * tileb;
2251 
2252     if (start_level <= 1) {
2253         unsigned alignment = MAX2(256, mtileb);
2254         surf->bo_alignment = MAX2(surf->bo_alignment, alignment);
2255 
2256         if (aligned_offset) {
2257             aligned_offset = ALIGN(aligned_offset, alignment);
2258         }
2259     }
2260 
2261     /* build mipmap tree */
2262     for (i = start_level; i <= surf->last_level; i++) {
2263         level[i].mode = RADEON_SURF_MODE_2D;
2264         si_surf_minify_2d(surf, level+i, bpe, i, slice_pt, mtilew, mtileh, 1, mtileb, aligned_offset);
2265         if (level[i].mode == RADEON_SURF_MODE_1D) {
2266             switch (tile_mode) {
2267             case CIK_TILE_MODE_COLOR_2D:
2268                 tile_mode = SI_TILE_MODE_COLOR_1D;
2269                 break;
2270             case CIK_TILE_MODE_COLOR_2D_SCANOUT:
2271                 tile_mode = SI_TILE_MODE_COLOR_1D_SCANOUT;
2272                 break;
2273             case CIK_TILE_MODE_DEPTH_STENCIL_2D_TILESPLIT_64:
2274             case CIK_TILE_MODE_DEPTH_STENCIL_2D_TILESPLIT_128:
2275             case CIK_TILE_MODE_DEPTH_STENCIL_2D_TILESPLIT_256:
2276             case CIK_TILE_MODE_DEPTH_STENCIL_2D_TILESPLIT_512:
2277             case CIK_TILE_MODE_DEPTH_STENCIL_2D_TILESPLIT_ROW_SIZE:
2278                 tile_mode = CIK_TILE_MODE_DEPTH_STENCIL_1D;
2279                 break;
2280             default:
2281                 return -EINVAL;
2282             }
2283             return si_surface_init_1d(surf_man, surf, level, bpe, tile_mode, offset, i);
2284         }
2285         /* level0 and first mipmap need to have alignment */
2286         aligned_offset = offset = surf->bo_size;
2287         if (i == 0) {
2288             aligned_offset = ALIGN(aligned_offset, surf->bo_alignment);
2289         }
2290         if (surf->flags & RADEON_SURF_HAS_TILE_MODE_INDEX) {
2291             if (surf->level == level) {
2292                 surf->tiling_index[i] = tile_mode;
2293                 /* it's ok because stencil is done after */
2294                 surf->stencil_tiling_index[i] = tile_mode;
2295             } else {
2296                 surf->stencil_tiling_index[i] = tile_mode;
2297             }
2298         }
2299     }
2300     return 0;
2301 }
2302 
cik_surface_init_2d_miptrees(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,unsigned tile_mode,unsigned stencil_tile_mode)2303 static int cik_surface_init_2d_miptrees(struct radeon_surface_manager *surf_man,
2304                                         struct radeon_surface *surf,
2305                                         unsigned tile_mode, unsigned stencil_tile_mode)
2306 {
2307     int r;
2308     uint32_t num_pipes, num_banks;
2309 
2310     cik_get_2d_params(surf_man, surf->bpe, surf->nsamples,
2311                         !(surf->flags & RADEON_SURF_Z_OR_SBUFFER), tile_mode,
2312                         &num_pipes, NULL, &num_banks, NULL, NULL, NULL);
2313 
2314     r = cik_surface_init_2d(surf_man, surf, surf->level, surf->bpe, tile_mode,
2315                             surf->tile_split, num_pipes, num_banks, 0, 0);
2316     if (r) {
2317         return r;
2318     }
2319 
2320     if (surf->flags & RADEON_SURF_SBUFFER) {
2321         r = cik_surface_init_2d(surf_man, surf, surf->stencil_level, 1, stencil_tile_mode,
2322                                 surf->stencil_tile_split, num_pipes, num_banks,
2323                                 surf->bo_size, 0);
2324         surf->stencil_offset = surf->stencil_level[0].offset;
2325     }
2326     return r;
2327 }
2328 
cik_surface_init(struct radeon_surface_manager * surf_man,struct radeon_surface * surf)2329 static int cik_surface_init(struct radeon_surface_manager *surf_man,
2330                             struct radeon_surface *surf)
2331 {
2332     unsigned mode, tile_mode, stencil_tile_mode;
2333     int r;
2334 
2335     /* MSAA surfaces support the 2D mode only. */
2336     if (surf->nsamples > 1) {
2337         surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
2338         surf->flags |= RADEON_SURF_SET(RADEON_SURF_MODE_2D, MODE);
2339     }
2340 
2341     /* tiling mode */
2342     mode = (surf->flags >> RADEON_SURF_MODE_SHIFT) & RADEON_SURF_MODE_MASK;
2343 
2344     if (surf->flags & (RADEON_SURF_ZBUFFER | RADEON_SURF_SBUFFER)) {
2345         /* zbuffer only support 1D or 2D tiled surface */
2346         switch (mode) {
2347         case RADEON_SURF_MODE_1D:
2348         case RADEON_SURF_MODE_2D:
2349             break;
2350         default:
2351             mode = RADEON_SURF_MODE_1D;
2352             surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
2353             surf->flags |= RADEON_SURF_SET(RADEON_SURF_MODE_1D, MODE);
2354             break;
2355         }
2356     }
2357 
2358     r = cik_surface_sanity(surf_man, surf, mode, &tile_mode, &stencil_tile_mode);
2359     if (r) {
2360         return r;
2361     }
2362 
2363     surf->stencil_offset = 0;
2364     surf->bo_alignment = 0;
2365 
2366     /* check tiling mode */
2367     switch (mode) {
2368     case RADEON_SURF_MODE_LINEAR:
2369         r = r6_surface_init_linear(surf_man, surf, 0, 0);
2370         break;
2371     case RADEON_SURF_MODE_LINEAR_ALIGNED:
2372         r = si_surface_init_linear_aligned(surf_man, surf, tile_mode, 0, 0);
2373         break;
2374     case RADEON_SURF_MODE_1D:
2375         r = si_surface_init_1d_miptrees(surf_man, surf, tile_mode, stencil_tile_mode);
2376         break;
2377     case RADEON_SURF_MODE_2D:
2378         r = cik_surface_init_2d_miptrees(surf_man, surf, tile_mode, stencil_tile_mode);
2379         break;
2380     default:
2381         return -EINVAL;
2382     }
2383     return r;
2384 }
2385 
2386 /*
2387  * depending on surface
2388  */
cik_surface_best(struct radeon_surface_manager * surf_man,struct radeon_surface * surf)2389 static int cik_surface_best(struct radeon_surface_manager *surf_man,
2390                             struct radeon_surface *surf)
2391 {
2392     unsigned mode, tile_mode, stencil_tile_mode;
2393 
2394     /* tiling mode */
2395     mode = (surf->flags >> RADEON_SURF_MODE_SHIFT) & RADEON_SURF_MODE_MASK;
2396 
2397     if (surf->flags & (RADEON_SURF_ZBUFFER | RADEON_SURF_SBUFFER) &&
2398         !(surf->flags & RADEON_SURF_HAS_TILE_MODE_INDEX)) {
2399         /* depth/stencil force 1d tiling for old mesa */
2400         surf->flags = RADEON_SURF_CLR(surf->flags, MODE);
2401         surf->flags |= RADEON_SURF_SET(RADEON_SURF_MODE_1D, MODE);
2402     }
2403 
2404     return cik_surface_sanity(surf_man, surf, mode, &tile_mode, &stencil_tile_mode);
2405 }
2406 
2407 
2408 /* ===========================================================================
2409  * public API
2410  */
2411 drm_public struct radeon_surface_manager *
radeon_surface_manager_new(int fd)2412 radeon_surface_manager_new(int fd)
2413 {
2414     struct radeon_surface_manager *surf_man;
2415 
2416     surf_man = calloc(1, sizeof(struct radeon_surface_manager));
2417     if (surf_man == NULL) {
2418         return NULL;
2419     }
2420     surf_man->fd = fd;
2421     if (radeon_get_value(fd, RADEON_INFO_DEVICE_ID, &surf_man->device_id)) {
2422         goto out_err;
2423     }
2424     if (radeon_get_family(surf_man)) {
2425         goto out_err;
2426     }
2427 
2428     if (surf_man->family <= CHIP_RV740) {
2429         if (r6_init_hw_info(surf_man)) {
2430             goto out_err;
2431         }
2432         surf_man->surface_init = &r6_surface_init;
2433         surf_man->surface_best = &r6_surface_best;
2434     } else if (surf_man->family <= CHIP_ARUBA) {
2435         if (eg_init_hw_info(surf_man)) {
2436             goto out_err;
2437         }
2438         surf_man->surface_init = &eg_surface_init;
2439         surf_man->surface_best = &eg_surface_best;
2440     } else if (surf_man->family < CHIP_BONAIRE) {
2441         if (si_init_hw_info(surf_man)) {
2442             goto out_err;
2443         }
2444         surf_man->surface_init = &si_surface_init;
2445         surf_man->surface_best = &si_surface_best;
2446     } else {
2447         if (cik_init_hw_info(surf_man)) {
2448             goto out_err;
2449         }
2450         surf_man->surface_init = &cik_surface_init;
2451         surf_man->surface_best = &cik_surface_best;
2452     }
2453 
2454     return surf_man;
2455 out_err:
2456     free(surf_man);
2457     return NULL;
2458 }
2459 
2460 drm_public void
radeon_surface_manager_free(struct radeon_surface_manager * surf_man)2461 radeon_surface_manager_free(struct radeon_surface_manager *surf_man)
2462 {
2463     free(surf_man);
2464 }
2465 
radeon_surface_sanity(struct radeon_surface_manager * surf_man,struct radeon_surface * surf,unsigned type,unsigned mode)2466 static int radeon_surface_sanity(struct radeon_surface_manager *surf_man,
2467                                  struct radeon_surface *surf,
2468                                  unsigned type,
2469                                  unsigned mode)
2470 {
2471     if (surf_man == NULL || surf_man->surface_init == NULL || surf == NULL) {
2472         return -EINVAL;
2473     }
2474 
2475     /* all dimension must be at least 1 ! */
2476     if (!surf->npix_x || !surf->npix_y || !surf->npix_z) {
2477         return -EINVAL;
2478     }
2479     if (!surf->blk_w || !surf->blk_h || !surf->blk_d) {
2480         return -EINVAL;
2481     }
2482     if (!surf->array_size) {
2483         return -EINVAL;
2484     }
2485     /* array size must be a power of 2 */
2486     surf->array_size = next_power_of_two(surf->array_size);
2487 
2488     switch (surf->nsamples) {
2489     case 1:
2490     case 2:
2491     case 4:
2492     case 8:
2493         break;
2494     default:
2495         return -EINVAL;
2496     }
2497     /* check type */
2498     switch (type) {
2499     case RADEON_SURF_TYPE_1D:
2500         if (surf->npix_y > 1) {
2501             return -EINVAL;
2502         }
2503         /* fallthrough */
2504     case RADEON_SURF_TYPE_2D:
2505         if (surf->npix_z > 1) {
2506             return -EINVAL;
2507         }
2508         break;
2509     case RADEON_SURF_TYPE_CUBEMAP:
2510         if (surf->npix_z > 1) {
2511             return -EINVAL;
2512         }
2513         /* deal with cubemap as they were texture array */
2514         if (surf_man->family >= CHIP_RV770) {
2515             surf->array_size = 8;
2516         } else {
2517             surf->array_size = 6;
2518         }
2519         break;
2520     case RADEON_SURF_TYPE_3D:
2521         break;
2522     case RADEON_SURF_TYPE_1D_ARRAY:
2523         if (surf->npix_y > 1) {
2524             return -EINVAL;
2525         }
2526     case RADEON_SURF_TYPE_2D_ARRAY:
2527         break;
2528     default:
2529         return -EINVAL;
2530     }
2531     return 0;
2532 }
2533 
2534 drm_public int
radeon_surface_init(struct radeon_surface_manager * surf_man,struct radeon_surface * surf)2535 radeon_surface_init(struct radeon_surface_manager *surf_man,
2536                     struct radeon_surface *surf)
2537 {
2538     unsigned mode, type;
2539     int r;
2540 
2541     type = RADEON_SURF_GET(surf->flags, TYPE);
2542     mode = RADEON_SURF_GET(surf->flags, MODE);
2543 
2544     r = radeon_surface_sanity(surf_man, surf, type, mode);
2545     if (r) {
2546         return r;
2547     }
2548     return surf_man->surface_init(surf_man, surf);
2549 }
2550 
2551 drm_public int
radeon_surface_best(struct radeon_surface_manager * surf_man,struct radeon_surface * surf)2552 radeon_surface_best(struct radeon_surface_manager *surf_man,
2553                     struct radeon_surface *surf)
2554 {
2555     unsigned mode, type;
2556     int r;
2557 
2558     type = RADEON_SURF_GET(surf->flags, TYPE);
2559     mode = RADEON_SURF_GET(surf->flags, MODE);
2560 
2561     r = radeon_surface_sanity(surf_man, surf, type, mode);
2562     if (r) {
2563         return r;
2564     }
2565     return surf_man->surface_best(surf_man, surf);
2566 }
2567