1 /**************************************************************************
2  *
3  * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
4  * All Rights Reserved.
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a
7  * copy of this software and associated documentation files (the
8  * "Software"), to deal in the Software without restriction, including
9  * without limitation the rights to use, copy, modify, merge, publish,
10  * distribute, sub license, and/or sell copies of the Software, and to
11  * permit persons to whom the Software is furnished to do so, subject to
12  * the following conditions:
13  *
14  * The above copyright notice and this permission notice (including the
15  * next paragraph) shall be included in all copies or substantial portions
16  * of the Software.
17  *
18  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21  * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22  * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23  * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24  * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25  *
26  **************************************************************************/
27 
28 /*
29  * Render unclipped vertex buffers by emitting vertices directly to
30  * dma buffers.  Use strip/fan hardware acceleration where possible.
31  *
32  */
33 #include "main/glheader.h"
34 #include "main/context.h"
35 #include "main/macros.h"
36 #include "main/imports.h"
37 #include "main/mtypes.h"
38 #include "main/enums.h"
39 
40 #include "math/m_xform.h"
41 
42 #include "tnl/t_context.h"
43 #include "tnl/t_vertex.h"
44 #include "tnl/t_pipeline.h"
45 
46 #include "intel_screen.h"
47 #include "intel_context.h"
48 #include "intel_tris.h"
49 #include "intel_batchbuffer.h"
50 #include "intel_reg.h"
51 
52 /*
53  * Render unclipped vertex buffers by emitting vertices directly to
54  * dma buffers.  Use strip/fan hardware primitives where possible.
55  * Try to simulate missing primitives with indexed vertices.
56  */
/*
 * Hardware capability switches (1 = available to the rendering template,
 * 0 = not used).  Presumably consumed by tnl_dd/t_dd_dmatmp.h, which is
 * included further down in this file.
 */
#define HAVE_POINTS      0      /* The hardware has points, but they cannot
                                 * be used here: subpixel has to be adjusted
                                 * for points on the INTEL/I845G.
                                 */
#define HAVE_LINES       1
#define HAVE_LINE_STRIPS 1
#define HAVE_TRIANGLES   1
#define HAVE_TRI_STRIPS  1
#define HAVE_TRI_STRIP_1 0      /* The hardware has it, but the template
                                 * cannot use it yet.
                                 */
#define HAVE_TRI_FANS    1
#define HAVE_POLYGONS    1
#define HAVE_QUADS       0
#define HAVE_QUAD_STRIPS 0

/* Indexed (element) rendering is not used by this path. */
#define HAVE_ELTS        0
71 
72 static uint32_t hw_prim[GL_POLYGON + 1] = {
73    0,
74    PRIM3D_LINELIST,
75    PRIM3D_LINESTRIP,
76    PRIM3D_LINESTRIP,
77    PRIM3D_TRILIST,
78    PRIM3D_TRISTRIP,
79    PRIM3D_TRIFAN,
80    0,
81    0,
82    PRIM3D_POLY
83 };
84 
85 static const GLenum reduced_prim[GL_POLYGON + 1] = {
86    GL_POINTS,
87    GL_LINES,
88    GL_LINES,
89    GL_LINES,
90    GL_TRIANGLES,
91    GL_TRIANGLES,
92    GL_TRIANGLES,
93    GL_TRIANGLES,
94    GL_TRIANGLES,
95    GL_TRIANGLES
96 };
97 
98 static const int scale_prim[GL_POLYGON + 1] = {
99    0,                           /* fallback case */
100    1,
101    2,
102    2,
103    1,
104    3,
105    3,
106    0,                           /* fallback case */
107    0,                           /* fallback case */
108    3
109 };
110 
111 
112 static void
intelDmaPrimitive(struct intel_context * intel,GLenum prim)113 intelDmaPrimitive(struct intel_context *intel, GLenum prim)
114 {
115    if (0)
116       fprintf(stderr, "%s %s\n", __FUNCTION__, _mesa_lookup_enum_by_nr(prim));
117    INTEL_FIREVERTICES(intel);
118    intel->vtbl.reduced_primitive_state(intel, reduced_prim[prim]);
119    intel_set_prim(intel, hw_prim[prim]);
120 }
121 
122 #define INTEL_NO_VBO_STATE_RESERVED 1500
123 
intel_get_vb_max(struct intel_context * intel)124 static INLINE GLuint intel_get_vb_max(struct intel_context *intel)
125 {
126    GLuint ret;
127 
128    if (intel->intelScreen->no_vbo) {
129       ret = intel->batch.bo->size - INTEL_NO_VBO_STATE_RESERVED;
130    } else
131       ret = INTEL_VB_SIZE;
132    ret /= (intel->vertex_size * 4);
133    return ret;
134 }
135 
intel_get_current_max(struct intel_context * intel)136 static INLINE GLuint intel_get_current_max(struct intel_context *intel)
137 {
138    GLuint ret;
139 
140    if (intel->intelScreen->no_vbo) {
141       ret = intel_batchbuffer_space(intel);
142       ret = ret <= INTEL_NO_VBO_STATE_RESERVED ? 0 : ret - INTEL_NO_VBO_STATE_RESERVED;
143    } else
144       ret = (INTEL_VB_SIZE - intel->prim.current_offset);
145 
146    return ret / (intel->vertex_size * 4);
147 }
148 
149 #define LOCAL_VARS struct intel_context *intel = intel_context(ctx)
150 #define INIT( prim ) 				\
151 do {						\
152    intelDmaPrimitive( intel, prim );		\
153 } while (0)
154 
155 #define FLUSH() INTEL_FIREVERTICES(intel)
156 
157 #define GET_SUBSEQUENT_VB_MAX_VERTS() intel_get_vb_max(intel)
158 #define GET_CURRENT_VB_MAX_VERTS() intel_get_current_max(intel)
159 
160 #define ALLOC_VERTS(nr) intel_get_prim_space(intel, nr)
161 
162 #define EMIT_VERTS( ctx, j, nr, buf ) \
163   _tnl_emit_vertices_to_buffer(ctx, j, (j)+(nr), buf )
164 
165 #define TAG(x) intel_##x
166 #include "tnl_dd/t_dd_dmatmp.h"
167 
168 
169 /**********************************************************************/
170 /*                          Render pipeline stage                     */
171 /**********************************************************************/
172 
173 /* Heuristic to choose between the two render paths:
174  */
175 static bool
choose_render(struct intel_context * intel,struct vertex_buffer * VB)176 choose_render(struct intel_context *intel, struct vertex_buffer *VB)
177 {
178    int vertsz = intel->vertex_size;
179    int cost_render = 0;
180    int cost_fallback = 0;
181    int nr_prims = 0;
182    int nr_rprims = 0;
183    int nr_rverts = 0;
184    int rprim = intel->reduced_primitive;
185    int i = 0;
186 
187    for (i = 0; i < VB->PrimitiveCount; i++) {
188       GLuint prim = VB->Primitive[i].mode;
189       GLuint length = VB->Primitive[i].count;
190 
191       if (!length)
192          continue;
193 
194       nr_prims++;
195       nr_rverts += length * scale_prim[prim & PRIM_MODE_MASK];
196 
197       if (reduced_prim[prim & PRIM_MODE_MASK] != rprim) {
198          nr_rprims++;
199          rprim = reduced_prim[prim & PRIM_MODE_MASK];
200       }
201    }
202 
203    /* One point for each generated primitive:
204     */
205    cost_render = nr_prims;
206    cost_fallback = nr_rprims;
207 
208    /* One point for every 1024 dwords (4k) of dma:
209     */
210    cost_render += (vertsz * i) / 1024;
211    cost_fallback += (vertsz * nr_rverts) / 1024;
212 
213    if (0)
214       fprintf(stderr, "cost render: %d fallback: %d\n",
215               cost_render, cost_fallback);
216 
217    if (cost_render > cost_fallback)
218       return false;
219 
220    return true;
221 }
222 
223 
224 static GLboolean
intel_run_render(struct gl_context * ctx,struct tnl_pipeline_stage * stage)225 intel_run_render(struct gl_context * ctx, struct tnl_pipeline_stage *stage)
226 {
227    struct intel_context *intel = intel_context(ctx);
228    TNLcontext *tnl = TNL_CONTEXT(ctx);
229    struct vertex_buffer *VB = &tnl->vb;
230    GLuint i;
231 
232    intel->vtbl.render_prevalidate( intel );
233 
234    /* Don't handle clipping or indexed vertices.
235     */
236    if (intel->RenderIndex != 0 ||
237        !intel_validate_render(ctx, VB) || !choose_render(intel, VB)) {
238       return true;
239    }
240 
241    tnl->clipspace.new_inputs |= VERT_BIT_POS;
242 
243    tnl->Driver.Render.Start(ctx);
244 
245    for (i = 0; i < VB->PrimitiveCount; i++) {
246       GLuint prim = _tnl_translate_prim(&VB->Primitive[i]);
247       GLuint start = VB->Primitive[i].start;
248       GLuint length = VB->Primitive[i].count;
249 
250       if (!length)
251          continue;
252 
253       intel_render_tab_verts[prim & PRIM_MODE_MASK] (ctx, start,
254                                                      start + length, prim);
255    }
256 
257    tnl->Driver.Render.Finish(ctx);
258 
259    INTEL_FIREVERTICES(intel);
260 
261    return false;             /* finished the pipe */
262 }
263 
264 static const struct tnl_pipeline_stage _intel_render_stage = {
265    "intel render",
266    NULL,
267    NULL,
268    NULL,
269    NULL,
270    intel_run_render             /* run */
271 };
272 
273 const struct tnl_pipeline_stage *intel_pipeline[] = {
274    &_tnl_vertex_transform_stage,
275    &_tnl_normal_transform_stage,
276    &_tnl_lighting_stage,
277    &_tnl_fog_coordinate_stage,
278    &_tnl_texgen_stage,
279    &_tnl_texture_transform_stage,
280    &_tnl_point_attenuation_stage,
281    &_tnl_vertex_program_stage,
282 #if 1
283    &_intel_render_stage,        /* ADD: unclipped rastersetup-to-dma */
284 #endif
285    &_tnl_render_stage,
286    0,
287 };
288