1 /**********************************************************
2  * Copyright 2008-2009 VMware, Inc.  All rights reserved.
3  *
4  * Permission is hereby granted, free of charge, to any person
5  * obtaining a copy of this software and associated documentation
6  * files (the "Software"), to deal in the Software without
7  * restriction, including without limitation the rights to use, copy,
8  * modify, merge, publish, distribute, sublicense, and/or sell copies
9  * of the Software, and to permit persons to whom the Software is
10  * furnished to do so, subject to the following conditions:
11  *
12  * The above copyright notice and this permission notice shall be
13  * included in all copies or substantial portions of the Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22  * SOFTWARE.
23  *
24  **********************************************************/
25 
26 #include "svga_cmd.h"
27 
28 #include "pipe/p_state.h"
29 #include "pipe/p_defines.h"
30 #include "util/u_inlines.h"
31 #include "os/os_thread.h"
32 #include "util/u_format.h"
33 #include "util/u_math.h"
34 #include "util/u_memory.h"
35 
36 #include "svga_format.h"
37 #include "svga_screen.h"
38 #include "svga_context.h"
39 #include "svga_resource_texture.h"
40 #include "svga_resource_buffer.h"
41 #include "svga_sampler_view.h"
42 #include "svga_winsys.h"
43 #include "svga_debug.h"
44 
45 
46 /* XXX: This isn't a real hardware flag, but just a hack for kernel to
47  * know about primary surfaces. Find a better way to accomplish this.
48  */
49 #define SVGA3D_SURFACE_HINT_SCANOUT (1 << 9)
50 
51 
52 static INLINE void
svga_transfer_dma_band(struct svga_context * svga,struct svga_transfer * st,SVGA3dTransferType transfer,unsigned y,unsigned h,unsigned srcy,SVGA3dSurfaceDMAFlags flags)53 svga_transfer_dma_band(struct svga_context *svga,
54                        struct svga_transfer *st,
55                        SVGA3dTransferType transfer,
56                        unsigned y, unsigned h, unsigned srcy,
57                        SVGA3dSurfaceDMAFlags flags)
58 {
59    struct svga_texture *texture = svga_texture(st->base.resource);
60    SVGA3dCopyBox box;
61    enum pipe_error ret;
62 
63    box.x = st->base.box.x;
64    box.y = y;
65    box.z = st->base.box.z;
66    box.w = st->base.box.width;
67    box.h = h;
68    box.d = 1;
69    box.srcx = 0;
70    box.srcy = srcy;
71    box.srcz = 0;
72 
73    if (st->base.resource->target == PIPE_TEXTURE_CUBE) {
74       st->face = st->base.box.z;
75       box.z = 0;
76    }
77    else
78       st->face = 0;
79 
80    SVGA_DBG(DEBUG_DMA, "dma %s sid %p, face %u, (%u, %u, %u) - (%u, %u, %u), %ubpp\n",
81                 transfer == SVGA3D_WRITE_HOST_VRAM ? "to" : "from",
82                 texture->handle,
83                 st->face,
84                 st->base.box.x,
85                 y,
86                 box.z,
87                 st->base.box.x + st->base.box.width,
88                 y + h,
89                 box.z + 1,
90                 util_format_get_blocksize(texture->b.b.format) * 8 /
91                 (util_format_get_blockwidth(texture->b.b.format)*util_format_get_blockheight(texture->b.b.format)));
92 
93    ret = SVGA3D_SurfaceDMA(svga->swc, st, transfer, &box, 1, flags);
94    if(ret != PIPE_OK) {
95       svga_context_flush(svga, NULL);
96       ret = SVGA3D_SurfaceDMA(svga->swc, st, transfer, &box, 1, flags);
97       assert(ret == PIPE_OK);
98    }
99 }
100 
101 
102 static INLINE void
svga_transfer_dma(struct svga_context * svga,struct svga_transfer * st,SVGA3dTransferType transfer,SVGA3dSurfaceDMAFlags flags)103 svga_transfer_dma(struct svga_context *svga,
104                   struct svga_transfer *st,
105                   SVGA3dTransferType transfer,
106                   SVGA3dSurfaceDMAFlags flags)
107 {
108    struct svga_texture *texture = svga_texture(st->base.resource);
109    struct svga_screen *screen = svga_screen(texture->b.b.screen);
110    struct svga_winsys_screen *sws = screen->sws;
111    struct pipe_fence_handle *fence = NULL;
112 
113    if (transfer == SVGA3D_READ_HOST_VRAM) {
114       SVGA_DBG(DEBUG_PERF, "%s: readback transfer\n", __FUNCTION__);
115    }
116 
117    /* Ensure any pending operations on host surfaces are queued on the command
118     * buffer first.
119     */
120    svga_surfaces_flush( svga );
121 
122    if(!st->swbuf) {
123       /* Do the DMA transfer in a single go */
124 
125       svga_transfer_dma_band(svga, st, transfer,
126                              st->base.box.y, st->base.box.height, 0,
127                              flags);
128 
129       if(transfer == SVGA3D_READ_HOST_VRAM) {
130          svga_context_flush(svga, &fence);
131          sws->fence_finish(sws, fence, 0);
132          sws->fence_reference(sws, &fence, NULL);
133       }
134    }
135    else {
136       unsigned y, h, srcy;
137       unsigned blockheight = util_format_get_blockheight(st->base.resource->format);
138       h = st->hw_nblocksy * blockheight;
139       srcy = 0;
140       for(y = 0; y < st->base.box.height; y += h) {
141          unsigned offset, length;
142          void *hw, *sw;
143 
144          if (y + h > st->base.box.height)
145             h = st->base.box.height - y;
146 
147          /* Transfer band must be aligned to pixel block boundaries */
148          assert(y % blockheight == 0);
149          assert(h % blockheight == 0);
150 
151          offset = y * st->base.stride / blockheight;
152          length = h * st->base.stride / blockheight;
153 
154          sw = (uint8_t *)st->swbuf + offset;
155 
156          if (transfer == SVGA3D_WRITE_HOST_VRAM) {
157             unsigned usage = PIPE_TRANSFER_WRITE;
158 
159             /* Wait for the previous DMAs to complete */
160             /* TODO: keep one DMA (at half the size) in the background */
161             if (y) {
162                svga_context_flush(svga, NULL);
163                usage |= PIPE_TRANSFER_DISCARD_WHOLE_RESOURCE;
164             }
165 
166             hw = sws->buffer_map(sws, st->hwbuf, usage);
167             assert(hw);
168             if (hw) {
169                memcpy(hw, sw, length);
170                sws->buffer_unmap(sws, st->hwbuf);
171             }
172          }
173 
174          svga_transfer_dma_band(svga, st, transfer, y, h, srcy, flags);
175 
176          /*
177           * Prevent the texture contents to be discarded on the next band
178           * upload.
179           */
180 
181          flags.discard = FALSE;
182 
183          if(transfer == SVGA3D_READ_HOST_VRAM) {
184             svga_context_flush(svga, &fence);
185             sws->fence_finish(sws, fence, 0);
186 
187             hw = sws->buffer_map(sws, st->hwbuf, PIPE_TRANSFER_READ);
188             assert(hw);
189             if(hw) {
190                memcpy(sw, hw, length);
191                sws->buffer_unmap(sws, st->hwbuf);
192             }
193          }
194       }
195    }
196 }
197 
198 
199 static boolean
svga_texture_get_handle(struct pipe_screen * screen,struct pipe_resource * texture,struct winsys_handle * whandle)200 svga_texture_get_handle(struct pipe_screen *screen,
201                                struct pipe_resource *texture,
202                                struct winsys_handle *whandle)
203 {
204    struct svga_winsys_screen *sws = svga_winsys_screen(texture->screen);
205    unsigned stride;
206 
207    assert(svga_texture(texture)->key.cachable == 0);
208    svga_texture(texture)->key.cachable = 0;
209    stride = util_format_get_nblocksx(texture->format, texture->width0) *
210             util_format_get_blocksize(texture->format);
211    return sws->surface_get_handle(sws, svga_texture(texture)->handle, stride, whandle);
212 }
213 
214 
215 static void
svga_texture_destroy(struct pipe_screen * screen,struct pipe_resource * pt)216 svga_texture_destroy(struct pipe_screen *screen,
217 		     struct pipe_resource *pt)
218 {
219    struct svga_screen *ss = svga_screen(screen);
220    struct svga_texture *tex = (struct svga_texture *)pt;
221 
222    ss->texture_timestamp++;
223 
224    svga_sampler_view_reference(&tex->cached_view, NULL);
225 
226    /*
227      DBG("%s deleting %p\n", __FUNCTION__, (void *) tex);
228    */
229    SVGA_DBG(DEBUG_DMA, "unref sid %p (texture)\n", tex->handle);
230    svga_screen_surface_destroy(ss, &tex->key, &tex->handle);
231 
232    FREE(tex);
233 }
234 
235 
236 /* XXX: Still implementing this as if it was a screen function, but
237  * can now modify it to queue transfers on the context.
238  */
239 static struct pipe_transfer *
svga_texture_get_transfer(struct pipe_context * pipe,struct pipe_resource * texture,unsigned level,unsigned usage,const struct pipe_box * box)240 svga_texture_get_transfer(struct pipe_context *pipe,
241                           struct pipe_resource *texture,
242                           unsigned level,
243                           unsigned usage,
244                           const struct pipe_box *box)
245 {
246    struct svga_context *svga = svga_context(pipe);
247    struct svga_screen *ss = svga_screen(pipe->screen);
248    struct svga_winsys_screen *sws = ss->sws;
249    struct svga_transfer *st;
250    unsigned nblocksx = util_format_get_nblocksx(texture->format, box->width);
251    unsigned nblocksy = util_format_get_nblocksy(texture->format, box->height);
252 
253    /* We can't map texture storage directly */
254    if (usage & PIPE_TRANSFER_MAP_DIRECTLY)
255       return NULL;
256 
257    assert(box->depth == 1);
258    st = CALLOC_STRUCT(svga_transfer);
259    if (!st)
260       return NULL;
261 
262    pipe_resource_reference(&st->base.resource, texture);
263    st->base.level = level;
264    st->base.usage = usage;
265    st->base.box = *box;
266    st->base.stride = nblocksx*util_format_get_blocksize(texture->format);
267    st->base.layer_stride = 0;
268 
269    st->hw_nblocksy = nblocksy;
270 
271    st->hwbuf = svga_winsys_buffer_create(svga,
272                                          1,
273                                          0,
274                                          st->hw_nblocksy*st->base.stride);
275    while(!st->hwbuf && (st->hw_nblocksy /= 2)) {
276       st->hwbuf = svga_winsys_buffer_create(svga,
277                                             1,
278                                             0,
279                                             st->hw_nblocksy*st->base.stride);
280    }
281 
282    if(!st->hwbuf)
283       goto no_hwbuf;
284 
285    if(st->hw_nblocksy < nblocksy) {
286       /* We couldn't allocate a hardware buffer big enough for the transfer,
287        * so allocate regular malloc memory instead */
288       if (0) {
289          debug_printf("%s: failed to allocate %u KB of DMA, "
290                       "splitting into %u x %u KB DMA transfers\n",
291                       __FUNCTION__,
292                       (nblocksy*st->base.stride + 1023)/1024,
293                       (nblocksy + st->hw_nblocksy - 1)/st->hw_nblocksy,
294                       (st->hw_nblocksy*st->base.stride + 1023)/1024);
295       }
296 
297       st->swbuf = MALLOC(nblocksy*st->base.stride);
298       if(!st->swbuf)
299          goto no_swbuf;
300    }
301 
302    if (usage & PIPE_TRANSFER_READ) {
303       SVGA3dSurfaceDMAFlags flags;
304       memset(&flags, 0, sizeof flags);
305       svga_transfer_dma(svga, st, SVGA3D_READ_HOST_VRAM, flags);
306    }
307 
308    return &st->base;
309 
310 no_swbuf:
311    sws->buffer_destroy(sws, st->hwbuf);
312 no_hwbuf:
313    FREE(st);
314    return NULL;
315 }
316 
317 
318 /* XXX: Still implementing this as if it was a screen function, but
319  * can now modify it to queue transfers on the context.
320  */
321 static void *
svga_texture_transfer_map(struct pipe_context * pipe,struct pipe_transfer * transfer)322 svga_texture_transfer_map( struct pipe_context *pipe,
323 			   struct pipe_transfer *transfer )
324 {
325    struct svga_screen *ss = svga_screen(pipe->screen);
326    struct svga_winsys_screen *sws = ss->sws;
327    struct svga_transfer *st = svga_transfer(transfer);
328 
329    if(st->swbuf)
330       return st->swbuf;
331    else
332       /* The wait for read transfers already happened when svga_transfer_dma
333        * was called. */
334       return sws->buffer_map(sws, st->hwbuf, transfer->usage);
335 }
336 
337 
338 /* XXX: Still implementing this as if it was a screen function, but
339  * can now modify it to queue transfers on the context.
340  */
341 static void
svga_texture_transfer_unmap(struct pipe_context * pipe,struct pipe_transfer * transfer)342 svga_texture_transfer_unmap(struct pipe_context *pipe,
343 			    struct pipe_transfer *transfer)
344 {
345    struct svga_screen *ss = svga_screen(pipe->screen);
346    struct svga_winsys_screen *sws = ss->sws;
347    struct svga_transfer *st = svga_transfer(transfer);
348 
349    if(!st->swbuf)
350       sws->buffer_unmap(sws, st->hwbuf);
351 }
352 
353 
354 static void
svga_texture_transfer_destroy(struct pipe_context * pipe,struct pipe_transfer * transfer)355 svga_texture_transfer_destroy(struct pipe_context *pipe,
356 			      struct pipe_transfer *transfer)
357 {
358    struct svga_context *svga = svga_context(pipe);
359    struct svga_texture *tex = svga_texture(transfer->resource);
360    struct svga_screen *ss = svga_screen(pipe->screen);
361    struct svga_winsys_screen *sws = ss->sws;
362    struct svga_transfer *st = svga_transfer(transfer);
363 
364    if (st->base.usage & PIPE_TRANSFER_WRITE) {
365       SVGA3dSurfaceDMAFlags flags;
366 
367       memset(&flags, 0, sizeof flags);
368       if (transfer->usage & PIPE_TRANSFER_DISCARD_WHOLE_RESOURCE) {
369          flags.discard = TRUE;
370       }
371       if (transfer->usage & PIPE_TRANSFER_UNSYNCHRONIZED) {
372          flags.unsynchronized = TRUE;
373       }
374 
375       svga_transfer_dma(svga, st, SVGA3D_WRITE_HOST_VRAM, flags);
376       ss->texture_timestamp++;
377       tex->view_age[transfer->level] = ++(tex->age);
378       if (transfer->resource->target == PIPE_TEXTURE_CUBE)
379          tex->defined[transfer->box.z][transfer->level] = TRUE;
380       else
381          tex->defined[0][transfer->level] = TRUE;
382    }
383 
384    pipe_resource_reference(&st->base.resource, NULL);
385    FREE(st->swbuf);
386    sws->buffer_destroy(sws, st->hwbuf);
387    FREE(st);
388 }
389 
390 
391 struct u_resource_vtbl svga_texture_vtbl =
392 {
393    svga_texture_get_handle,	      /* get_handle */
394    svga_texture_destroy,	      /* resource_destroy */
395    svga_texture_get_transfer,	      /* get_transfer */
396    svga_texture_transfer_destroy,     /* transfer_destroy */
397    svga_texture_transfer_map,	      /* transfer_map */
398    u_default_transfer_flush_region,   /* transfer_flush_region */
399    svga_texture_transfer_unmap,	      /* transfer_unmap */
400    u_default_transfer_inline_write    /* transfer_inline_write */
401 };
402 
403 
404 struct pipe_resource *
svga_texture_create(struct pipe_screen * screen,const struct pipe_resource * template)405 svga_texture_create(struct pipe_screen *screen,
406                     const struct pipe_resource *template)
407 {
408    struct svga_screen *svgascreen = svga_screen(screen);
409    struct svga_texture *tex = CALLOC_STRUCT(svga_texture);
410 
411    if (!tex)
412       goto error1;
413 
414    tex->b.b = *template;
415    tex->b.vtbl = &svga_texture_vtbl;
416    pipe_reference_init(&tex->b.b.reference, 1);
417    tex->b.b.screen = screen;
418 
419    assert(template->last_level < SVGA_MAX_TEXTURE_LEVELS);
420    if(template->last_level >= SVGA_MAX_TEXTURE_LEVELS)
421       goto error2;
422 
423    tex->key.flags = 0;
424    tex->key.size.width = template->width0;
425    tex->key.size.height = template->height0;
426    tex->key.size.depth = template->depth0;
427 
428    if(template->target == PIPE_TEXTURE_CUBE) {
429       tex->key.flags |= SVGA3D_SURFACE_CUBEMAP;
430       tex->key.numFaces = 6;
431    }
432    else {
433       tex->key.numFaces = 1;
434    }
435 
436    tex->key.cachable = 1;
437 
438    if (template->bind & PIPE_BIND_SAMPLER_VIEW)
439       tex->key.flags |= SVGA3D_SURFACE_HINT_TEXTURE;
440 
441    if (template->bind & PIPE_BIND_DISPLAY_TARGET) {
442       tex->key.cachable = 0;
443    }
444 
445    if (template->bind & PIPE_BIND_SHARED) {
446       tex->key.cachable = 0;
447    }
448 
449    if (template->bind & (PIPE_BIND_SCANOUT |
450                          PIPE_BIND_CURSOR)) {
451       tex->key.flags |= SVGA3D_SURFACE_HINT_SCANOUT;
452       tex->key.cachable = 0;
453    }
454 
455    /*
456     * Note: Previously we never passed the
457     * SVGA3D_SURFACE_HINT_RENDERTARGET hint. Mesa cannot
458     * know beforehand whether a texture will be used as a rendertarget or not
459     * and it always requests PIPE_BIND_RENDER_TARGET, therefore
460     * passing the SVGA3D_SURFACE_HINT_RENDERTARGET here defeats its purpose.
461     *
462     * However, this was changed since other state trackers
463     * (XA for example) uses it accurately and certain device versions
464     * relies on it in certain situations to render correctly.
465     */
466    if((template->bind & PIPE_BIND_RENDER_TARGET) &&
467       !util_format_is_s3tc(template->format))
468       tex->key.flags |= SVGA3D_SURFACE_HINT_RENDERTARGET;
469 
470    if(template->bind & PIPE_BIND_DEPTH_STENCIL)
471       tex->key.flags |= SVGA3D_SURFACE_HINT_DEPTHSTENCIL;
472 
473    tex->key.numMipLevels = template->last_level + 1;
474 
475    tex->key.format = svga_translate_format(svgascreen, template->format, template->bind);
476    if(tex->key.format == SVGA3D_FORMAT_INVALID)
477       goto error2;
478 
479    SVGA_DBG(DEBUG_DMA, "surface_create for texture\n", tex->handle);
480    tex->handle = svga_screen_surface_create(svgascreen, &tex->key);
481    if (tex->handle)
482       SVGA_DBG(DEBUG_DMA, "  --> got sid %p (texture)\n", tex->handle);
483 
484    debug_reference(&tex->b.b.reference,
485                    (debug_reference_descriptor)debug_describe_resource, 0);
486 
487    return &tex->b.b;
488 
489 error2:
490    FREE(tex);
491 error1:
492    return NULL;
493 }
494 
495 
496 struct pipe_resource *
svga_texture_from_handle(struct pipe_screen * screen,const struct pipe_resource * template,struct winsys_handle * whandle)497 svga_texture_from_handle(struct pipe_screen *screen,
498 			 const struct pipe_resource *template,
499 			 struct winsys_handle *whandle)
500 {
501    struct svga_winsys_screen *sws = svga_winsys_screen(screen);
502    struct svga_winsys_surface *srf;
503    struct svga_texture *tex;
504    enum SVGA3dSurfaceFormat format = 0;
505    assert(screen);
506 
507    /* Only supports one type */
508    if ((template->target != PIPE_TEXTURE_2D &&
509        template->target != PIPE_TEXTURE_RECT) ||
510        template->last_level != 0 ||
511        template->depth0 != 1) {
512       return NULL;
513    }
514 
515    srf = sws->surface_from_handle(sws, whandle, &format);
516 
517    if (!srf)
518       return NULL;
519 
520    if (svga_translate_format(svga_screen(screen), template->format, template->bind) != format) {
521       unsigned f1 = svga_translate_format(svga_screen(screen), template->format, template->bind);
522       unsigned f2 = format;
523 
524       /* It's okay for XRGB and ARGB or depth with/out stencil to get mixed up */
525       if ( !( (f1 == SVGA3D_X8R8G8B8 && f2 == SVGA3D_A8R8G8B8) ||
526               (f1 == SVGA3D_A8R8G8B8 && f2 == SVGA3D_X8R8G8B8) ||
527               (f1 == SVGA3D_Z_D24X8 && f2 == SVGA3D_Z_D24S8) ||
528               (f1 == SVGA3D_Z_DF24 && f2 == SVGA3D_Z_D24S8_INT) ) ) {
529          debug_printf("%s wrong format %u != %u\n", __FUNCTION__, f1, f2);
530          return NULL;
531       }
532    }
533 
534    tex = CALLOC_STRUCT(svga_texture);
535    if (!tex)
536       return NULL;
537 
538    tex->b.b = *template;
539    tex->b.vtbl = &svga_texture_vtbl;
540    pipe_reference_init(&tex->b.b.reference, 1);
541    tex->b.b.screen = screen;
542 
543    if (format == SVGA3D_X8R8G8B8)
544       tex->b.b.format = PIPE_FORMAT_B8G8R8X8_UNORM;
545    else if (format == SVGA3D_A8R8G8B8)
546       tex->b.b.format = PIPE_FORMAT_B8G8R8A8_UNORM;
547    else {
548       /* ?? */
549    }
550 
551    SVGA_DBG(DEBUG_DMA, "wrap surface sid %p\n", srf);
552 
553    tex->key.cachable = 0;
554    tex->handle = srf;
555 
556    return &tex->b.b;
557 }
558