1 /**********************************************************
2  * Copyright 2008-2009 VMware, Inc.  All rights reserved.
3  *
4  * Permission is hereby granted, free of charge, to any person
5  * obtaining a copy of this software and associated documentation
6  * files (the "Software"), to deal in the Software without
7  * restriction, including without limitation the rights to use, copy,
8  * modify, merge, publish, distribute, sublicense, and/or sell copies
9  * of the Software, and to permit persons to whom the Software is
10  * furnished to do so, subject to the following conditions:
11  *
12  * The above copyright notice and this permission notice shall be
13  * included in all copies or substantial portions of the Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22  * SOFTWARE.
23  *
24  **********************************************************/
25 
26 #include "util/u_inlines.h"
27 #include "util/u_prim.h"
28 #include "util/u_upload_mgr.h"
29 #include "indices/u_indices.h"
30 
31 #include "svga_cmd.h"
32 #include "svga_draw.h"
33 #include "svga_draw_private.h"
34 #include "svga_resource_buffer.h"
35 #include "svga_winsys.h"
36 #include "svga_context.h"
37 #include "svga_hw_reg.h"
38 
39 
40 /**
41  * Return a new index buffer which contains a translation of the original
42  * index buffer.  An example of a translation is converting from QUAD
43  * primitives to TRIANGLE primitives.  Each set of four indexes for a quad
44  * will be converted to six indices for two triangles.
45  *
46  * Before generating the new index buffer we'll check if the incoming
47  * buffer already has a translated buffer that can be re-used.
48  * This benefits demos like Cinebench R15 which has many
49  * glDrawElements(GL_QUADS) commands (we can't draw quads natively).
50  *
51  * \param offset  offset in bytes to first index to translate in src buffer
52  * \param orig_prim  original primitive type (like PIPE_PRIM_QUADS)
53  * \param gen_prim  new/generated primitive type (like PIPE_PRIM_TRIANGLES)
54  * \param orig_nr  number of indexes to translate in source buffer
55  * \param gen_nr  number of indexes to write into new/dest buffer
56  * \param index_size  bytes per index (2 or 4)
57  * \param translate  the translation function from the u_translate module
58  * \param out_buf  returns the new/translated index buffer
59  * \return error code to indicate success failure
60  */
61 static enum pipe_error
translate_indices(struct svga_hwtnl * hwtnl,struct pipe_resource * src,unsigned offset,enum pipe_prim_type orig_prim,enum pipe_prim_type gen_prim,unsigned orig_nr,unsigned gen_nr,unsigned index_size,u_translate_func translate,struct pipe_resource ** out_buf)62 translate_indices(struct svga_hwtnl *hwtnl, struct pipe_resource *src,
63                   unsigned offset,
64                   enum pipe_prim_type orig_prim, enum pipe_prim_type gen_prim,
65                   unsigned orig_nr, unsigned gen_nr,
66                   unsigned index_size,
67                   u_translate_func translate, struct pipe_resource **out_buf)
68 {
69    struct pipe_context *pipe = &hwtnl->svga->pipe;
70    struct svga_screen *screen = svga_screen(pipe->screen);
71    struct svga_buffer *src_sbuf = svga_buffer(src);
72    struct pipe_transfer *src_transfer = NULL;
73    struct pipe_transfer *dst_transfer = NULL;
74    unsigned size = index_size * gen_nr;
75    const void *src_map = NULL;
76    struct pipe_resource *dst = NULL;
77    void *dst_map = NULL;
78 
79    assert(index_size == 2 || index_size == 4);
80 
81    if (!screen->debug.no_cache_index_buffers) {
82       /* Check if we already have a translated index buffer */
83       if (src_sbuf->translated_indices.buffer &&
84           src_sbuf->translated_indices.orig_prim == orig_prim &&
85           src_sbuf->translated_indices.new_prim == gen_prim &&
86           src_sbuf->translated_indices.offset == offset &&
87           src_sbuf->translated_indices.count == orig_nr &&
88           src_sbuf->translated_indices.index_size == index_size) {
89          pipe_resource_reference(out_buf, src_sbuf->translated_indices.buffer);
90          return PIPE_OK;
91       }
92    }
93 
94    /* Need to trim vertex count to make sure we don't write too much data
95     * to the dst buffer in the translate() call.
96     */
97    u_trim_pipe_prim(gen_prim, &gen_nr);
98 
99    size = index_size * gen_nr;
100 
101    dst = pipe_buffer_create(pipe->screen,
102                             PIPE_BIND_INDEX_BUFFER, PIPE_USAGE_DEFAULT, size);
103    if (!dst)
104       goto fail;
105 
106    src_map = pipe_buffer_map(pipe, src, PIPE_TRANSFER_READ, &src_transfer);
107    if (!src_map)
108       goto fail;
109 
110    dst_map = pipe_buffer_map(pipe, dst, PIPE_TRANSFER_WRITE, &dst_transfer);
111    if (!dst_map)
112       goto fail;
113 
114    translate((const char *) src_map + offset, 0, 0, gen_nr, 0, dst_map);
115 
116    pipe_buffer_unmap(pipe, src_transfer);
117    pipe_buffer_unmap(pipe, dst_transfer);
118 
119    *out_buf = dst;
120 
121    if (!screen->debug.no_cache_index_buffers) {
122       /* Save the new, translated index buffer in the hope we can use it
123        * again in the future.
124        */
125       pipe_resource_reference(&src_sbuf->translated_indices.buffer, dst);
126       src_sbuf->translated_indices.orig_prim = orig_prim;
127       src_sbuf->translated_indices.new_prim = gen_prim;
128       src_sbuf->translated_indices.offset = offset;
129       src_sbuf->translated_indices.count = orig_nr;
130       src_sbuf->translated_indices.index_size = index_size;
131    }
132 
133    return PIPE_OK;
134 
135  fail:
136    if (src_map)
137       pipe_buffer_unmap(pipe, src_transfer);
138 
139    if (dst_map)
140       pipe_buffer_unmap(pipe, dst_transfer);
141 
142    if (dst)
143       pipe->screen->resource_destroy(pipe->screen, dst);
144 
145    return PIPE_ERROR_OUT_OF_MEMORY;
146 }
147 
148 
149 enum pipe_error
svga_hwtnl_simple_draw_range_elements(struct svga_hwtnl * hwtnl,struct pipe_resource * index_buffer,unsigned index_size,int index_bias,unsigned min_index,unsigned max_index,enum pipe_prim_type prim,unsigned start,unsigned count,unsigned start_instance,unsigned instance_count)150 svga_hwtnl_simple_draw_range_elements(struct svga_hwtnl *hwtnl,
151                                       struct pipe_resource *index_buffer,
152                                       unsigned index_size, int index_bias,
153                                       unsigned min_index, unsigned max_index,
154                                       enum pipe_prim_type prim, unsigned start,
155                                       unsigned count,
156                                       unsigned start_instance,
157                                       unsigned instance_count)
158 {
159    SVGA3dPrimitiveRange range;
160    unsigned hw_prim;
161    unsigned hw_count;
162    unsigned index_offset = start * index_size;
163 
164    hw_prim = svga_translate_prim(prim, count, &hw_count);
165    if (hw_count == 0)
166       return PIPE_OK; /* nothing to draw */
167 
168    range.primType = hw_prim;
169    range.primitiveCount = hw_count;
170    range.indexArray.offset = index_offset;
171    range.indexArray.stride = index_size;
172    range.indexWidth = index_size;
173    range.indexBias = index_bias;
174 
175    return svga_hwtnl_prim(hwtnl, &range, count,
176                           min_index, max_index, index_buffer,
177                           start_instance, instance_count);
178 }
179 
180 
181 enum pipe_error
svga_hwtnl_draw_range_elements(struct svga_hwtnl * hwtnl,struct pipe_resource * index_buffer,unsigned index_size,int index_bias,unsigned min_index,unsigned max_index,enum pipe_prim_type prim,unsigned start,unsigned count,unsigned start_instance,unsigned instance_count)182 svga_hwtnl_draw_range_elements(struct svga_hwtnl *hwtnl,
183                                struct pipe_resource *index_buffer,
184                                unsigned index_size, int index_bias,
185                                unsigned min_index, unsigned max_index,
186                                enum pipe_prim_type prim, unsigned start, unsigned count,
187                                unsigned start_instance, unsigned instance_count)
188 {
189    enum pipe_prim_type gen_prim;
190    unsigned gen_size, gen_nr;
191    enum indices_mode gen_type;
192    u_translate_func gen_func;
193    enum pipe_error ret = PIPE_OK;
194 
195    SVGA_STATS_TIME_PUSH(svga_sws(hwtnl->svga),
196                         SVGA_STATS_TIME_HWTNLDRAWELEMENTS);
197 
198    if (svga_need_unfilled_fallback(hwtnl, prim)) {
199       gen_type = u_unfilled_translator(prim,
200                                        index_size,
201                                        count,
202                                        hwtnl->api_fillmode,
203                                        &gen_prim,
204                                        &gen_size, &gen_nr, &gen_func);
205    }
206    else {
207       gen_type = u_index_translator(svga_hw_prims,
208                                     prim,
209                                     index_size,
210                                     count,
211                                     hwtnl->api_pv,
212                                     hwtnl->hw_pv,
213                                     PR_DISABLE,
214                                     &gen_prim, &gen_size, &gen_nr, &gen_func);
215    }
216 
217    if (gen_type == U_TRANSLATE_MEMCPY) {
218       /* No need for translation, just pass through to hardware:
219        */
220       ret = svga_hwtnl_simple_draw_range_elements(hwtnl, index_buffer,
221                                                    index_size,
222                                                    index_bias,
223                                                    min_index,
224                                                    max_index,
225                                                    gen_prim, start, count,
226                                                    start_instance,
227                                                    instance_count);
228    }
229    else {
230       struct pipe_resource *gen_buf = NULL;
231 
232       /* Need to allocate a new index buffer and run the translate
233        * func to populate it.  Could potentially cache this translated
234        * index buffer with the original to avoid future
235        * re-translations.  Not much point if we're just accelerating
236        * GL though, as index buffers are typically used only once
237        * there.
238        */
239       ret = translate_indices(hwtnl,
240                               index_buffer,
241                               start * index_size,
242                               prim, gen_prim,
243                               count, gen_nr, gen_size,
244                               gen_func, &gen_buf);
245       if (ret == PIPE_OK) {
246          ret = svga_hwtnl_simple_draw_range_elements(hwtnl,
247                                                      gen_buf,
248                                                      gen_size,
249                                                      index_bias,
250                                                      min_index,
251                                                      max_index,
252                                                      gen_prim, 0, gen_nr,
253                                                      start_instance,
254                                                      instance_count);
255       }
256 
257       if (gen_buf) {
258          pipe_resource_reference(&gen_buf, NULL);
259       }
260    }
261 
262    SVGA_STATS_TIME_POP(svga_sws(hwtnl->svga));
263    return ret;
264 }
265