1 /*
2 Copyright (C) Intel Corp. 2006. All Rights Reserved.
3 Intel funded Tungsten Graphics (http://www.tungstengraphics.com) to
4 develop this 3D driver.
5
6 Permission is hereby granted, free of charge, to any person obtaining
7 a copy of this software and associated documentation files (the
8 "Software"), to deal in the Software without restriction, including
9 without limitation the rights to use, copy, modify, merge, publish,
10 distribute, sublicense, and/or sell copies of the Software, and to
11 permit persons to whom the Software is furnished to do so, subject to
12 the following conditions:
13
14 The above copyright notice and this permission notice (including the
15 next paragraph) shall be included in all copies or substantial
16 portions of the Software.
17
18 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
19 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
21 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
22 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
23 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
24 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25
26 **********************************************************************/
27 /*
28 * Authors:
29 * Keith Whitwell <keith@tungstengraphics.com>
30 */
31
32 #include "main/glheader.h"
33 #include "main/macros.h"
34 #include "main/enums.h"
35 #include "program/program.h"
36
37 #include "intel_batchbuffer.h"
38
39 #include "brw_defines.h"
40 #include "brw_context.h"
41 #include "brw_eu.h"
42 #include "brw_clip.h"
43
44
45
brw_clip_line_alloc_regs(struct brw_clip_compile * c)46 static void brw_clip_line_alloc_regs( struct brw_clip_compile *c )
47 {
48 struct intel_context *intel = &c->func.brw->intel;
49 GLuint i = 0,j;
50
51 /* Register usage is static, precompute here:
52 */
53 c->reg.R0 = retype(brw_vec8_grf(i, 0), BRW_REGISTER_TYPE_UD); i++;
54
55 if (c->key.nr_userclip) {
56 c->reg.fixed_planes = brw_vec4_grf(i, 0);
57 i += (6 + c->key.nr_userclip + 1) / 2;
58
59 c->prog_data.curb_read_length = (6 + c->key.nr_userclip + 1) / 2;
60 }
61 else
62 c->prog_data.curb_read_length = 0;
63
64
65 /* Payload vertices plus space for more generated vertices:
66 */
67 for (j = 0; j < 4; j++) {
68 c->reg.vertex[j] = brw_vec4_grf(i, 0);
69 i += c->nr_regs;
70 }
71
72 c->reg.t = brw_vec1_grf(i, 0);
73 c->reg.t0 = brw_vec1_grf(i, 1);
74 c->reg.t1 = brw_vec1_grf(i, 2);
75 c->reg.planemask = retype(brw_vec1_grf(i, 3), BRW_REGISTER_TYPE_UD);
76 c->reg.plane_equation = brw_vec4_grf(i, 4);
77 i++;
78
79 c->reg.dp0 = brw_vec1_grf(i, 0); /* fixme - dp4 will clobber r.1,2,3 */
80 c->reg.dp1 = brw_vec1_grf(i, 4);
81 i++;
82
83 if (!c->key.nr_userclip) {
84 c->reg.fixed_planes = brw_vec8_grf(i, 0);
85 i++;
86 }
87
88 if (intel->needs_ff_sync) {
89 c->reg.ff_sync = retype(brw_vec1_grf(i, 0), BRW_REGISTER_TYPE_UD);
90 i++;
91 }
92
93 c->first_tmp = i;
94 c->last_tmp = i;
95
96 c->prog_data.urb_read_length = c->nr_regs; /* ? */
97 c->prog_data.total_grf = i;
98 }
99
100
101
102 /* Line clipping, more or less following the following algorithm:
103 *
104 * for (p=0;p<MAX_PLANES;p++) {
105 * if (clipmask & (1 << p)) {
106 * GLfloat dp0 = DOTPROD( vtx0, plane[p] );
107 * GLfloat dp1 = DOTPROD( vtx1, plane[p] );
108 *
109 * if (IS_NEGATIVE(dp1)) {
110 * GLfloat t = dp1 / (dp1 - dp0);
111 * if (t > t1) t1 = t;
112 * } else {
113 * GLfloat t = dp0 / (dp0 - dp1);
114 * if (t > t0) t0 = t;
115 * }
116 *
117 * if (t0 + t1 >= 1.0)
118 * return;
119 * }
120 * }
121 *
122 * interp( ctx, newvtx0, vtx0, vtx1, t0 );
123 * interp( ctx, newvtx1, vtx1, vtx0, t1 );
124 *
125 */
clip_and_emit_line(struct brw_clip_compile * c)126 static void clip_and_emit_line( struct brw_clip_compile *c )
127 {
128 struct brw_compile *p = &c->func;
129 struct brw_context *brw = p->brw;
130 struct brw_indirect vtx0 = brw_indirect(0, 0);
131 struct brw_indirect vtx1 = brw_indirect(1, 0);
132 struct brw_indirect newvtx0 = brw_indirect(2, 0);
133 struct brw_indirect newvtx1 = brw_indirect(3, 0);
134 struct brw_indirect plane_ptr = brw_indirect(4, 0);
135 struct brw_reg v1_null_ud = retype(vec1(brw_null_reg()), BRW_REGISTER_TYPE_UD);
136 GLuint hpos_offset = brw_vert_result_to_offset(&c->vue_map,
137 VERT_RESULT_HPOS);
138
139 brw_MOV(p, get_addr_reg(vtx0), brw_address(c->reg.vertex[0]));
140 brw_MOV(p, get_addr_reg(vtx1), brw_address(c->reg.vertex[1]));
141 brw_MOV(p, get_addr_reg(newvtx0), brw_address(c->reg.vertex[2]));
142 brw_MOV(p, get_addr_reg(newvtx1), brw_address(c->reg.vertex[3]));
143 brw_MOV(p, get_addr_reg(plane_ptr), brw_clip_plane0_address(c));
144
145 /* Note: init t0, t1 together:
146 */
147 brw_MOV(p, vec2(c->reg.t0), brw_imm_f(0));
148
149 brw_clip_init_planes(c);
150 brw_clip_init_clipmask(c);
151
152 /* -ve rhw workaround */
153 if (brw->has_negative_rhw_bug) {
154 brw_set_conditionalmod(p, BRW_CONDITIONAL_NZ);
155 brw_AND(p, brw_null_reg(), get_element_ud(c->reg.R0, 2),
156 brw_imm_ud(1<<20));
157 brw_OR(p, c->reg.planemask, c->reg.planemask, brw_imm_ud(0x3f));
158 }
159
160 brw_set_predicate_control(p, BRW_PREDICATE_NONE);
161
162 brw_DO(p, BRW_EXECUTE_1);
163 {
164 /* if (planemask & 1)
165 */
166 brw_set_conditionalmod(p, BRW_CONDITIONAL_NZ);
167 brw_AND(p, v1_null_ud, c->reg.planemask, brw_imm_ud(1));
168
169 brw_IF(p, BRW_EXECUTE_1);
170 {
171 if (c->key.nr_userclip)
172 brw_MOV(p, c->reg.plane_equation, deref_4f(plane_ptr, 0));
173 else
174 brw_MOV(p, c->reg.plane_equation, deref_4b(plane_ptr, 0));
175
176 /* dp = DP4(vtx->position, plane)
177 */
178 brw_DP4(p, vec4(c->reg.dp0), deref_4f(vtx0, hpos_offset), c->reg.plane_equation);
179
180 /* if (IS_NEGATIVE(dp1))
181 */
182 brw_set_conditionalmod(p, BRW_CONDITIONAL_L);
183 brw_DP4(p, vec4(c->reg.dp1), deref_4f(vtx1, hpos_offset), c->reg.plane_equation);
184 brw_IF(p, BRW_EXECUTE_1);
185 {
186 /*
187 * Both can be negative on GM965/G965 due to RHW workaround
188 * if so, this object should be rejected.
189 */
190 if (brw->has_negative_rhw_bug) {
191 brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_LE, c->reg.dp0, brw_imm_f(0.0));
192 brw_IF(p, BRW_EXECUTE_1);
193 {
194 brw_clip_kill_thread(c);
195 }
196 brw_ENDIF(p);
197 }
198
199 brw_ADD(p, c->reg.t, c->reg.dp1, negate(c->reg.dp0));
200 brw_math_invert(p, c->reg.t, c->reg.t);
201 brw_MUL(p, c->reg.t, c->reg.t, c->reg.dp1);
202
203 brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_G, c->reg.t, c->reg.t1 );
204 brw_MOV(p, c->reg.t1, c->reg.t);
205 brw_set_predicate_control(p, BRW_PREDICATE_NONE);
206 }
207 brw_ELSE(p);
208 {
209 /* Coming back in. We know that both cannot be negative
210 * because the line would have been culled in that case.
211 */
212
213 /* If both are positive, do nothing */
214 /* Only on GM965/G965 */
215 if (brw->has_negative_rhw_bug) {
216 brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_L, c->reg.dp0, brw_imm_f(0.0));
217 brw_IF(p, BRW_EXECUTE_1);
218 }
219
220 {
221 brw_ADD(p, c->reg.t, c->reg.dp0, negate(c->reg.dp1));
222 brw_math_invert(p, c->reg.t, c->reg.t);
223 brw_MUL(p, c->reg.t, c->reg.t, c->reg.dp0);
224
225 brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_G, c->reg.t, c->reg.t0 );
226 brw_MOV(p, c->reg.t0, c->reg.t);
227 brw_set_predicate_control(p, BRW_PREDICATE_NONE);
228 }
229
230 if (brw->has_negative_rhw_bug) {
231 brw_ENDIF(p);
232 }
233 }
234 brw_ENDIF(p);
235 }
236 brw_ENDIF(p);
237
238 /* plane_ptr++;
239 */
240 brw_ADD(p, get_addr_reg(plane_ptr), get_addr_reg(plane_ptr), brw_clip_plane_stride(c));
241
242 /* while (planemask>>=1) != 0
243 */
244 brw_set_conditionalmod(p, BRW_CONDITIONAL_NZ);
245 brw_SHR(p, c->reg.planemask, c->reg.planemask, brw_imm_ud(1));
246 }
247 brw_WHILE(p);
248
249 brw_ADD(p, c->reg.t, c->reg.t0, c->reg.t1);
250 brw_CMP(p, vec1(brw_null_reg()), BRW_CONDITIONAL_L, c->reg.t, brw_imm_f(1.0));
251 brw_IF(p, BRW_EXECUTE_1);
252 {
253 brw_clip_interp_vertex(c, newvtx0, vtx0, vtx1, c->reg.t0, false);
254 brw_clip_interp_vertex(c, newvtx1, vtx1, vtx0, c->reg.t1, false);
255
256 brw_clip_emit_vue(c, newvtx0, 1, 0,
257 (_3DPRIM_LINESTRIP << URB_WRITE_PRIM_TYPE_SHIFT)
258 | URB_WRITE_PRIM_START);
259 brw_clip_emit_vue(c, newvtx1, 0, 1,
260 (_3DPRIM_LINESTRIP << URB_WRITE_PRIM_TYPE_SHIFT)
261 | URB_WRITE_PRIM_END);
262 }
263 brw_ENDIF(p);
264 brw_clip_kill_thread(c);
265 }
266
267
268
brw_emit_line_clip(struct brw_clip_compile * c)269 void brw_emit_line_clip( struct brw_clip_compile *c )
270 {
271 brw_clip_line_alloc_regs(c);
272 brw_clip_init_ff_sync(c);
273
274 if (c->key.do_flat_shading) {
275 if (c->key.pv_first)
276 brw_clip_copy_colors(c, 1, 0);
277 else
278 brw_clip_copy_colors(c, 0, 1);
279 }
280
281 clip_and_emit_line(c);
282 }
283