1 /**********************************************************
2  * Copyright 2008-2009 VMware, Inc.  All rights reserved.
3  *
4  * Permission is hereby granted, free of charge, to any person
5  * obtaining a copy of this software and associated documentation
6  * files (the "Software"), to deal in the Software without
7  * restriction, including without limitation the rights to use, copy,
8  * modify, merge, publish, distribute, sublicense, and/or sell copies
9  * of the Software, and to permit persons to whom the Software is
10  * furnished to do so, subject to the following conditions:
11  *
12  * The above copyright notice and this permission notice shall be
13  * included in all copies or substantial portions of the Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22  * SOFTWARE.
23  *
24  **********************************************************/
25 
26 #include "util/u_inlines.h"
27 #include "pipe/p_defines.h"
28 
29 #include "svga_screen.h"
30 #include "svga_context.h"
31 #include "svga_state.h"
32 #include "svga_cmd.h"
33 #include "svga_tgsi.h"
34 #include "svga_debug.h"
35 
36 #include "svga_hw_reg.h"
37 
38 
39 /*
40  * Don't try to send more than 4kb of successive constants.
41  */
42 #define MAX_CONST_REG_COUNT 256  /**< number of float[4] constants */
43 
44 
45 
46 /**
47  * Convert from PIPE_SHADER_* to SVGA3D_SHADERTYPE_*
48  */
49 static int
svga_shader_type(unsigned shader)50 svga_shader_type(unsigned shader)
51 {
52    assert(PIPE_SHADER_VERTEX + 1 == SVGA3D_SHADERTYPE_VS);
53    assert(PIPE_SHADER_FRAGMENT + 1 == SVGA3D_SHADERTYPE_PS);
54    assert(shader <= PIPE_SHADER_FRAGMENT);
55    return shader + 1;
56 }
57 
58 
59 /**
60  * Check and emit one shader constant register.
61  * \param shader  PIPE_SHADER_FRAGMENT or PIPE_SHADER_VERTEX
62  * \param i  which float[4] constant to change
63  * \param value  the new float[4] value
64  */
65 static enum pipe_error
emit_const(struct svga_context * svga,unsigned shader,unsigned i,const float * value)66 emit_const(struct svga_context *svga, unsigned shader, unsigned i,
67            const float *value)
68 {
69    enum pipe_error ret = PIPE_OK;
70 
71    assert(shader < PIPE_SHADER_TYPES);
72    assert(i < SVGA3D_CONSTREG_MAX);
73 
74    if (memcmp(svga->state.hw_draw.cb[shader][i], value,
75               4 * sizeof(float)) != 0) {
76       if (SVGA_DEBUG & DEBUG_CONSTS)
77          debug_printf("%s %s %u: %f %f %f %f\n",
78                       __FUNCTION__,
79                       shader == PIPE_SHADER_VERTEX ? "VERT" : "FRAG",
80                       i,
81                       value[0],
82                       value[1],
83                       value[2],
84                       value[3]);
85 
86       ret = SVGA3D_SetShaderConst( svga->swc,
87                                    i,
88                                    svga_shader_type(shader),
89                                    SVGA3D_CONST_TYPE_FLOAT,
90                                    value );
91       if (ret != PIPE_OK)
92          return ret;
93 
94       memcpy(svga->state.hw_draw.cb[shader][i], value, 4 * sizeof(float));
95    }
96 
97    return ret;
98 }
99 
100 
101 /*
102  * Check and emit a range of shader constant registers, trying to coalesce
103  * successive shader constant updates in a single command in order to save
104  * space on the command buffer.  This is a HWv8 feature.
105  */
106 static enum pipe_error
emit_const_range(struct svga_context * svga,unsigned shader,unsigned offset,unsigned count,const float (* values)[4])107 emit_const_range(struct svga_context *svga,
108                  unsigned shader,
109                  unsigned offset,
110                  unsigned count,
111                  const float (*values)[4])
112 {
113    unsigned i, j;
114    enum pipe_error ret;
115 
116 #ifdef DEBUG
117    if (offset + count > SVGA3D_CONSTREG_MAX) {
118       debug_printf("svga: too many constants (offset + count = %u)\n",
119                    offset + count);
120    }
121 #endif
122 
123    if (offset > SVGA3D_CONSTREG_MAX) {
124       /* This isn't OK, but if we propagate an error all the way up we'll
125        * just get into more trouble.
126        * XXX note that offset is always zero at this time so this is moot.
127        */
128       return PIPE_OK;
129    }
130 
131    if (offset + count > SVGA3D_CONSTREG_MAX) {
132       /* Just drop the extra constants for now.
133        * Ideally we should not have allowed the app to create a shader
134        * that exceeds our constant buffer size but there's no way to
135        * express that in gallium at this time.
136        */
137       count = SVGA3D_CONSTREG_MAX - offset;
138    }
139 
140    i = 0;
141    while (i < count) {
142       if (memcmp(svga->state.hw_draw.cb[shader][offset + i],
143                  values[i],
144                  4 * sizeof(float)) != 0) {
145          /* Found one dirty constant
146           */
147          if (SVGA_DEBUG & DEBUG_CONSTS)
148             debug_printf("%s %s %d: %f %f %f %f\n",
149                          __FUNCTION__,
150                          shader == PIPE_SHADER_VERTEX ? "VERT" : "FRAG",
151                          offset + i,
152                          values[i][0],
153                          values[i][1],
154                          values[i][2],
155                          values[i][3]);
156 
157          /* Look for more consecutive dirty constants.
158           */
159          j = i + 1;
160          while (j < count &&
161                 j < i + MAX_CONST_REG_COUNT &&
162                 memcmp(svga->state.hw_draw.cb[shader][offset + j],
163                        values[j],
164                        4 * sizeof(float)) != 0) {
165 
166             if (SVGA_DEBUG & DEBUG_CONSTS)
167                debug_printf("%s %s %d: %f %f %f %f\n",
168                             __FUNCTION__,
169                             shader == PIPE_SHADER_VERTEX ? "VERT" : "FRAG",
170                             offset + j,
171                             values[j][0],
172                             values[j][1],
173                             values[j][2],
174                             values[j][3]);
175 
176             ++j;
177          }
178 
179          assert(j >= i + 1);
180 
181          /* Send them all together.
182           */
183          ret = SVGA3D_SetShaderConsts(svga->swc,
184                                       offset + i, j - i,
185                                       svga_shader_type(shader),
186                                       SVGA3D_CONST_TYPE_FLOAT,
187                                       values + i);
188          if (ret != PIPE_OK) {
189             return ret;
190          }
191 
192          /*
193           * Local copy of the hardware state.
194           */
195          memcpy(svga->state.hw_draw.cb[shader][offset + i],
196                 values[i],
197                 (j - i) * 4 * sizeof(float));
198 
199          i = j + 1;
200       } else {
201          ++i;
202       }
203    }
204 
205    return PIPE_OK;
206 }
207 
208 
209 /**
210  * Emit all the constants in a constant buffer for a shader stage.
211  */
212 static enum pipe_error
emit_consts(struct svga_context * svga,unsigned shader)213 emit_consts(struct svga_context *svga, unsigned shader)
214 {
215    struct svga_screen *ss = svga_screen(svga->pipe.screen);
216    struct pipe_transfer *transfer = NULL;
217    unsigned count;
218    const float (*data)[4] = NULL;
219    unsigned i;
220    enum pipe_error ret = PIPE_OK;
221    const unsigned offset = 0;
222 
223    assert(shader < PIPE_SHADER_TYPES);
224 
225    if (svga->curr.cb[shader] == NULL)
226       goto done;
227 
228    count = svga->curr.cb[shader]->width0 / (4 * sizeof(float));
229 
230    data = (const float (*)[4])pipe_buffer_map(&svga->pipe,
231                                               svga->curr.cb[shader],
232                                               PIPE_TRANSFER_READ,
233 					      &transfer);
234    if (data == NULL) {
235       ret = PIPE_ERROR_OUT_OF_MEMORY;
236       goto done;
237    }
238 
239    if (ss->hw_version >= SVGA3D_HWVERSION_WS8_B1) {
240       ret = emit_const_range( svga, shader, offset, count, data );
241       if (ret != PIPE_OK) {
242          goto done;
243       }
244    } else {
245       for (i = 0; i < count; i++) {
246          ret = emit_const( svga, shader, offset + i, data[i] );
247          if (ret != PIPE_OK) {
248             goto done;
249          }
250       }
251    }
252 
253 done:
254    if (data)
255       pipe_buffer_unmap(&svga->pipe, transfer);
256 
257    return ret;
258 }
259 
260 
261 static enum pipe_error
emit_fs_consts(struct svga_context * svga,unsigned dirty)262 emit_fs_consts(struct svga_context *svga, unsigned dirty)
263 {
264    const struct svga_shader_result *result = svga->state.hw_draw.fs;
265    enum pipe_error ret = PIPE_OK;
266 
267    ret = emit_consts( svga, PIPE_SHADER_FRAGMENT );
268    if (ret != PIPE_OK)
269       return ret;
270 
271    /* The internally generated fragment shader for xor blending
272     * doesn't have a 'result' struct.  It should be fixed to avoid
273     * this special case, but work around it with a NULL check:
274     */
275    if (result) {
276       const struct svga_fs_compile_key *key = &result->key.fkey;
277       if (key->num_unnormalized_coords) {
278          const unsigned offset =
279             result->shader->info.file_max[TGSI_FILE_CONSTANT] + 1;
280          unsigned i;
281 
282          for (i = 0; i < key->num_textures; i++) {
283             if (key->tex[i].unnormalized) {
284                struct pipe_resource *tex = svga->curr.sampler_views[i]->texture;
285                float data[4];
286 
287                data[0] = 1.0f / (float) tex->width0;
288                data[1] = 1.0f / (float) tex->height0;
289                data[2] = 1.0f;
290                data[3] = 1.0f;
291 
292                ret = emit_const(svga,
293                                 PIPE_SHADER_FRAGMENT,
294                                 key->tex[i].width_height_idx + offset,
295                                 data);
296                if (ret != PIPE_OK) {
297                   return ret;
298                }
299             }
300          }
301       }
302    }
303 
304    return PIPE_OK;
305 }
306 
307 
308 struct svga_tracked_state svga_hw_fs_constants =
309 {
310    "hw fs params",
311    (SVGA_NEW_FS_CONST_BUFFER |
312     SVGA_NEW_FS_RESULT |
313     SVGA_NEW_TEXTURE_BINDING),
314    emit_fs_consts
315 };
316 
317 
318 
319 static enum pipe_error
emit_vs_consts(struct svga_context * svga,unsigned dirty)320 emit_vs_consts(struct svga_context *svga, unsigned dirty)
321 {
322    const struct svga_shader_result *result = svga->state.hw_draw.vs;
323    const struct svga_vs_compile_key *key;
324    enum pipe_error ret = PIPE_OK;
325    unsigned offset;
326 
327    /* SVGA_NEW_VS_RESULT
328     */
329    if (result == NULL)
330       return PIPE_OK;
331 
332    key = &result->key.vkey;
333 
334    /* SVGA_NEW_VS_CONST_BUFFER
335     */
336    ret = emit_consts( svga, PIPE_SHADER_VERTEX );
337    if (ret != PIPE_OK)
338       return ret;
339 
340    /* offset = number of constants in the VS const buffer */
341    offset = result->shader->info.file_max[TGSI_FILE_CONSTANT] + 1;
342 
343    /* SVGA_NEW_VS_PRESCALE
344     * Put the viewport pre-scale/translate values into the const buffer.
345     */
346    if (key->need_prescale) {
347       ret = emit_const( svga, PIPE_SHADER_VERTEX, offset++,
348                         svga->state.hw_clear.prescale.scale );
349       if (ret != PIPE_OK)
350          return ret;
351 
352       ret = emit_const( svga, PIPE_SHADER_VERTEX, offset++,
353                         svga->state.hw_clear.prescale.translate );
354       if (ret != PIPE_OK)
355          return ret;
356    }
357 
358    return PIPE_OK;
359 }
360 
361 
362 struct svga_tracked_state svga_hw_vs_constants =
363 {
364    "hw vs params",
365    (SVGA_NEW_PRESCALE |
366     SVGA_NEW_VS_CONST_BUFFER |
367     SVGA_NEW_VS_RESULT),
368    emit_vs_consts
369 };
370