1 /*
2 * Copyright (C) 2010 Corbin Simpson
3 * Copyright (C) 2010 Marek Olšák <maraeo@gmail.com>
4 *
5 * All Rights Reserved.
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining
8 * a copy of this software and associated documentation files (the
9 * "Software"), to deal in the Software without restriction, including
10 * without limitation the rights to use, copy, modify, merge, publish,
11 * distribute, sublicense, and/or sell copies of the Software, and to
12 * permit persons to whom the Software is furnished to do so, subject to
13 * the following conditions:
14 *
15 * The above copyright notice and this permission notice (including the
16 * next paragraph) shall be included in all copies or substantial
17 * portions of the Software.
18 *
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
20 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
21 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
22 * IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
23 * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
24 * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
25 * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 *
27 */
28
29 #include "radeon_program_tex.h"
30
31 #include "radeon_compiler_util.h"
32
33 /* Series of transformations to be done on textures. */
34
shadow_fail_value(struct r300_fragment_program_compiler * compiler,int tmu)35 static struct rc_src_register shadow_fail_value(struct r300_fragment_program_compiler *compiler,
36 int tmu)
37 {
38 struct rc_src_register reg = { 0, 0, 0, 0, 0, 0 };
39
40 reg.File = RC_FILE_NONE;
41 reg.Swizzle = combine_swizzles(RC_SWIZZLE_0000,
42 compiler->state.unit[tmu].texture_swizzle);
43 return reg;
44 }
45
shadow_pass_value(struct r300_fragment_program_compiler * compiler,int tmu)46 static struct rc_src_register shadow_pass_value(struct r300_fragment_program_compiler *compiler,
47 int tmu)
48 {
49 struct rc_src_register reg = { 0, 0, 0, 0, 0, 0 };
50
51 reg.File = RC_FILE_NONE;
52 reg.Swizzle = combine_swizzles(RC_SWIZZLE_1111,
53 compiler->state.unit[tmu].texture_swizzle);
54 return reg;
55 }
56
scale_texcoords(struct r300_fragment_program_compiler * compiler,struct rc_instruction * inst,unsigned state_constant)57 static void scale_texcoords(struct r300_fragment_program_compiler *compiler,
58 struct rc_instruction *inst,
59 unsigned state_constant)
60 {
61 struct rc_instruction *inst_mov;
62
63 unsigned temp = rc_find_free_temporary(&compiler->Base);
64
65 inst_mov = rc_insert_new_instruction(&compiler->Base, inst->Prev);
66
67 inst_mov->U.I.Opcode = RC_OPCODE_MUL;
68 inst_mov->U.I.DstReg.File = RC_FILE_TEMPORARY;
69 inst_mov->U.I.DstReg.Index = temp;
70 inst_mov->U.I.SrcReg[0] = inst->U.I.SrcReg[0];
71 inst_mov->U.I.SrcReg[1].File = RC_FILE_CONSTANT;
72 inst_mov->U.I.SrcReg[1].Index =
73 rc_constants_add_state(&compiler->Base.Program.Constants,
74 state_constant, inst->U.I.TexSrcUnit);
75
76 reset_srcreg(&inst->U.I.SrcReg[0]);
77 inst->U.I.SrcReg[0].File = RC_FILE_TEMPORARY;
78 inst->U.I.SrcReg[0].Index = temp;
79 }
80
projective_divide(struct r300_fragment_program_compiler * compiler,struct rc_instruction * inst)81 static void projective_divide(struct r300_fragment_program_compiler *compiler,
82 struct rc_instruction *inst)
83 {
84 struct rc_instruction *inst_mul, *inst_rcp;
85
86 unsigned temp = rc_find_free_temporary(&compiler->Base);
87
88 inst_rcp = rc_insert_new_instruction(&compiler->Base, inst->Prev);
89 inst_rcp->U.I.Opcode = RC_OPCODE_RCP;
90 inst_rcp->U.I.DstReg.File = RC_FILE_TEMPORARY;
91 inst_rcp->U.I.DstReg.Index = temp;
92 inst_rcp->U.I.DstReg.WriteMask = RC_MASK_W;
93 inst_rcp->U.I.SrcReg[0] = inst->U.I.SrcReg[0];
94 /* Because the input can be arbitrarily swizzled,
95 * read the component mapped to W. */
96 inst_rcp->U.I.SrcReg[0].Swizzle =
97 RC_MAKE_SWIZZLE_SMEAR(GET_SWZ(inst->U.I.SrcReg[0].Swizzle, 3));
98
99 inst_mul = rc_insert_new_instruction(&compiler->Base, inst->Prev);
100 inst_mul->U.I.Opcode = RC_OPCODE_MUL;
101 inst_mul->U.I.DstReg.File = RC_FILE_TEMPORARY;
102 inst_mul->U.I.DstReg.Index = temp;
103 inst_mul->U.I.SrcReg[0] = inst->U.I.SrcReg[0];
104 inst_mul->U.I.SrcReg[1].File = RC_FILE_TEMPORARY;
105 inst_mul->U.I.SrcReg[1].Index = temp;
106 inst_mul->U.I.SrcReg[1].Swizzle = RC_SWIZZLE_WWWW;
107
108 reset_srcreg(&inst->U.I.SrcReg[0]);
109 inst->U.I.Opcode = RC_OPCODE_TEX;
110 inst->U.I.SrcReg[0].File = RC_FILE_TEMPORARY;
111 inst->U.I.SrcReg[0].Index = temp;
112 }
113
114 /**
115 * Transform TEX, TXP, TXB, and KIL instructions in the following ways:
116 * - implement texture compare (shadow extensions)
117 * - extract non-native source / destination operands
118 * - premultiply texture coordinates for RECT
119 * - extract operand swizzles
120 * - introduce a temporary register when write masks are needed
121 */
radeonTransformTEX(struct radeon_compiler * c,struct rc_instruction * inst,void * data)122 int radeonTransformTEX(
123 struct radeon_compiler * c,
124 struct rc_instruction * inst,
125 void* data)
126 {
127 struct r300_fragment_program_compiler *compiler =
128 (struct r300_fragment_program_compiler*)data;
129 rc_wrap_mode wrapmode = compiler->state.unit[inst->U.I.TexSrcUnit].wrap_mode;
130 int is_rect = inst->U.I.TexSrcTarget == RC_TEXTURE_RECT ||
131 compiler->state.unit[inst->U.I.TexSrcUnit].non_normalized_coords;
132
133 if (inst->U.I.Opcode != RC_OPCODE_TEX &&
134 inst->U.I.Opcode != RC_OPCODE_TXB &&
135 inst->U.I.Opcode != RC_OPCODE_TXP &&
136 inst->U.I.Opcode != RC_OPCODE_TXD &&
137 inst->U.I.Opcode != RC_OPCODE_TXL &&
138 inst->U.I.Opcode != RC_OPCODE_KIL)
139 return 0;
140
141 /* ARB_shadow & EXT_shadow_funcs */
142 if (inst->U.I.Opcode != RC_OPCODE_KIL &&
143 ((c->Program.ShadowSamplers & (1 << inst->U.I.TexSrcUnit)) ||
144 (compiler->state.unit[inst->U.I.TexSrcUnit].compare_mode_enabled))) {
145 rc_compare_func comparefunc = compiler->state.unit[inst->U.I.TexSrcUnit].texture_compare_func;
146
147 if (comparefunc == RC_COMPARE_FUNC_NEVER || comparefunc == RC_COMPARE_FUNC_ALWAYS) {
148 inst->U.I.Opcode = RC_OPCODE_MOV;
149
150 if (comparefunc == RC_COMPARE_FUNC_ALWAYS) {
151 inst->U.I.SrcReg[0] = shadow_pass_value(compiler, inst->U.I.TexSrcUnit);
152 } else {
153 inst->U.I.SrcReg[0] = shadow_fail_value(compiler, inst->U.I.TexSrcUnit);
154 }
155
156 return 1;
157 } else {
158 struct rc_instruction * inst_rcp = NULL;
159 struct rc_instruction *inst_mul, *inst_add, *inst_cmp;
160 unsigned tmp_texsample;
161 unsigned tmp_sum;
162 int pass, fail;
163
164 /* Save the output register. */
165 struct rc_dst_register output_reg = inst->U.I.DstReg;
166 unsigned saturate_mode = inst->U.I.SaturateMode;
167
168 /* Redirect TEX to a new temp. */
169 tmp_texsample = rc_find_free_temporary(c);
170 inst->U.I.SaturateMode = 0;
171 inst->U.I.DstReg.File = RC_FILE_TEMPORARY;
172 inst->U.I.DstReg.Index = tmp_texsample;
173 inst->U.I.DstReg.WriteMask = RC_MASK_XYZW;
174
175 tmp_sum = rc_find_free_temporary(c);
176
177 if (inst->U.I.Opcode == RC_OPCODE_TXP) {
178 /* Compute 1/W. */
179 inst_rcp = rc_insert_new_instruction(c, inst);
180 inst_rcp->U.I.Opcode = RC_OPCODE_RCP;
181 inst_rcp->U.I.DstReg.File = RC_FILE_TEMPORARY;
182 inst_rcp->U.I.DstReg.Index = tmp_sum;
183 inst_rcp->U.I.DstReg.WriteMask = RC_MASK_W;
184 inst_rcp->U.I.SrcReg[0] = inst->U.I.SrcReg[0];
185 inst_rcp->U.I.SrcReg[0].Swizzle =
186 RC_MAKE_SWIZZLE_SMEAR(GET_SWZ(inst->U.I.SrcReg[0].Swizzle, 3));
187 }
188
189 /* Divide Z by W (if it's TXP) and saturate. */
190 inst_mul = rc_insert_new_instruction(c, inst_rcp ? inst_rcp : inst);
191 inst_mul->U.I.Opcode = inst->U.I.Opcode == RC_OPCODE_TXP ? RC_OPCODE_MUL : RC_OPCODE_MOV;
192 inst_mul->U.I.DstReg.File = RC_FILE_TEMPORARY;
193 inst_mul->U.I.DstReg.Index = tmp_sum;
194 inst_mul->U.I.DstReg.WriteMask = RC_MASK_W;
195 inst_mul->U.I.SaturateMode = RC_SATURATE_ZERO_ONE;
196 inst_mul->U.I.SrcReg[0] = inst->U.I.SrcReg[0];
197 inst_mul->U.I.SrcReg[0].Swizzle =
198 RC_MAKE_SWIZZLE_SMEAR(GET_SWZ(inst->U.I.SrcReg[0].Swizzle, 2));
199 if (inst->U.I.Opcode == RC_OPCODE_TXP) {
200 inst_mul->U.I.SrcReg[1].File = RC_FILE_TEMPORARY;
201 inst_mul->U.I.SrcReg[1].Index = tmp_sum;
202 inst_mul->U.I.SrcReg[1].Swizzle = RC_SWIZZLE_WWWW;
203 }
204
205 /* Add the depth texture value. */
206 inst_add = rc_insert_new_instruction(c, inst_mul);
207 inst_add->U.I.Opcode = RC_OPCODE_ADD;
208 inst_add->U.I.DstReg.File = RC_FILE_TEMPORARY;
209 inst_add->U.I.DstReg.Index = tmp_sum;
210 inst_add->U.I.DstReg.WriteMask = RC_MASK_W;
211 inst_add->U.I.SrcReg[0].File = RC_FILE_TEMPORARY;
212 inst_add->U.I.SrcReg[0].Index = tmp_sum;
213 inst_add->U.I.SrcReg[0].Swizzle = RC_SWIZZLE_WWWW;
214 inst_add->U.I.SrcReg[1].File = RC_FILE_TEMPORARY;
215 inst_add->U.I.SrcReg[1].Index = tmp_texsample;
216 inst_add->U.I.SrcReg[1].Swizzle = RC_SWIZZLE_XXXX;
217
218 /* Note that SrcReg[0] is r, SrcReg[1] is tex and:
219 * LESS: r < tex <=> -tex+r < 0
220 * GEQUAL: r >= tex <=> not (-tex+r < 0)
221 * GREATER: r > tex <=> tex-r < 0
222 * LEQUAL: r <= tex <=> not ( tex-r < 0)
223 * EQUAL: GEQUAL
224 * NOTEQUAL:LESS
225 */
226
227 /* This negates either r or tex: */
228 if (comparefunc == RC_COMPARE_FUNC_LESS || comparefunc == RC_COMPARE_FUNC_GEQUAL ||
229 comparefunc == RC_COMPARE_FUNC_EQUAL || comparefunc == RC_COMPARE_FUNC_NOTEQUAL)
230 inst_add->U.I.SrcReg[1].Negate = inst_add->U.I.SrcReg[1].Negate ^ RC_MASK_XYZW;
231 else
232 inst_add->U.I.SrcReg[0].Negate = inst_add->U.I.SrcReg[0].Negate ^ RC_MASK_XYZW;
233
234 /* This negates the whole expresion: */
235 if (comparefunc == RC_COMPARE_FUNC_LESS || comparefunc == RC_COMPARE_FUNC_GREATER ||
236 comparefunc == RC_COMPARE_FUNC_NOTEQUAL) {
237 pass = 1;
238 fail = 2;
239 } else {
240 pass = 2;
241 fail = 1;
242 }
243
244 inst_cmp = rc_insert_new_instruction(c, inst_add);
245 inst_cmp->U.I.Opcode = RC_OPCODE_CMP;
246 inst_cmp->U.I.SaturateMode = saturate_mode;
247 inst_cmp->U.I.DstReg = output_reg;
248 inst_cmp->U.I.SrcReg[0].File = RC_FILE_TEMPORARY;
249 inst_cmp->U.I.SrcReg[0].Index = tmp_sum;
250 inst_cmp->U.I.SrcReg[0].Swizzle =
251 combine_swizzles(RC_SWIZZLE_WWWW,
252 compiler->state.unit[inst->U.I.TexSrcUnit].texture_swizzle);
253 inst_cmp->U.I.SrcReg[pass] = shadow_pass_value(compiler, inst->U.I.TexSrcUnit);
254 inst_cmp->U.I.SrcReg[fail] = shadow_fail_value(compiler, inst->U.I.TexSrcUnit);
255
256 assert(tmp_texsample != tmp_sum);
257 }
258 }
259
260 /* R300 cannot sample from rectangles and the wrap mode fallback needs
261 * normalized coordinates anyway. */
262 if (inst->U.I.Opcode != RC_OPCODE_KIL &&
263 is_rect && (!c->is_r500 || wrapmode != RC_WRAP_NONE)) {
264 scale_texcoords(compiler, inst, RC_STATE_R300_TEXRECT_FACTOR);
265 inst->U.I.TexSrcTarget = RC_TEXTURE_2D;
266 }
267
268 /* Divide by W if needed. */
269 if (inst->U.I.Opcode == RC_OPCODE_TXP &&
270 (wrapmode == RC_WRAP_REPEAT || wrapmode == RC_WRAP_MIRRORED_REPEAT ||
271 compiler->state.unit[inst->U.I.TexSrcUnit].clamp_and_scale_before_fetch)) {
272 projective_divide(compiler, inst);
273 }
274
275 /* Texture wrap modes don't work on NPOT textures.
276 *
277 * Non-wrapped/clamped texcoords with NPOT are free in HW. Repeat and
278 * mirroring are not. If we need to repeat, we do:
279 *
280 * MUL temp, texcoord, <scaling factor constant>
281 * FRC temp, temp ; Discard integer portion of coords
282 *
283 * This gives us coords in [0, 1].
284 *
285 * Mirroring is trickier. We're going to start out like repeat:
286 *
287 * MUL temp, texcoord, <scaling factor constant> ; De-mirror across axes
288 * MUL temp, temp, 0.5 ; Pattern repeats in [0, 2]
289 * ; so scale to [0, 1]
290 * FRC temp, temp ; Make the pattern repeat
291 * MAD temp, temp, 2, -1 ; Move the pattern to [-1, 1]
292 * ADD temp, 1, -abs(temp) ; Now comes a neat trick: use abs to mirror the pattern.
293 * ; The pattern is backwards, so reverse it (1-x).
294 *
295 * This gives us coords in [0, 1].
296 *
297 * ~ C & M. ;)
298 */
299 if (inst->U.I.Opcode != RC_OPCODE_KIL &&
300 wrapmode != RC_WRAP_NONE) {
301 struct rc_instruction *inst_mov;
302 unsigned temp = rc_find_free_temporary(c);
303
304 if (wrapmode == RC_WRAP_REPEAT) {
305 /* Both instructions will be paired up. */
306 struct rc_instruction *inst_frc = rc_insert_new_instruction(c, inst->Prev);
307
308 inst_frc->U.I.Opcode = RC_OPCODE_FRC;
309 inst_frc->U.I.DstReg.File = RC_FILE_TEMPORARY;
310 inst_frc->U.I.DstReg.Index = temp;
311 inst_frc->U.I.DstReg.WriteMask = RC_MASK_XYZ;
312 inst_frc->U.I.SrcReg[0] = inst->U.I.SrcReg[0];
313 } else if (wrapmode == RC_WRAP_MIRRORED_REPEAT) {
314 /*
315 * Function:
316 * f(v) = 1 - abs(frac(v * 0.5) * 2 - 1)
317 *
318 * Code:
319 * MUL temp, src0, 0.5
320 * FRC temp, temp
321 * MAD temp, temp, 2, -1
322 * ADD temp, 1, -abs(temp)
323 */
324
325 struct rc_instruction *inst_mul, *inst_frc, *inst_mad, *inst_add;
326 unsigned two, two_swizzle;
327
328 inst_mul = rc_insert_new_instruction(c, inst->Prev);
329
330 inst_mul->U.I.Opcode = RC_OPCODE_MUL;
331 inst_mul->U.I.DstReg.File = RC_FILE_TEMPORARY;
332 inst_mul->U.I.DstReg.Index = temp;
333 inst_mul->U.I.DstReg.WriteMask = RC_MASK_XYZ;
334 inst_mul->U.I.SrcReg[0] = inst->U.I.SrcReg[0];
335 inst_mul->U.I.SrcReg[1].Swizzle = RC_SWIZZLE_HHHH;
336
337 inst_frc = rc_insert_new_instruction(c, inst->Prev);
338
339 inst_frc->U.I.Opcode = RC_OPCODE_FRC;
340 inst_frc->U.I.DstReg.File = RC_FILE_TEMPORARY;
341 inst_frc->U.I.DstReg.Index = temp;
342 inst_frc->U.I.DstReg.WriteMask = RC_MASK_XYZ;
343 inst_frc->U.I.SrcReg[0].File = RC_FILE_TEMPORARY;
344 inst_frc->U.I.SrcReg[0].Index = temp;
345 inst_frc->U.I.SrcReg[0].Swizzle = RC_SWIZZLE_XYZ0;
346
347 two = rc_constants_add_immediate_scalar(&c->Program.Constants, 2, &two_swizzle);
348 inst_mad = rc_insert_new_instruction(c, inst->Prev);
349
350 inst_mad->U.I.Opcode = RC_OPCODE_MAD;
351 inst_mad->U.I.DstReg.File = RC_FILE_TEMPORARY;
352 inst_mad->U.I.DstReg.Index = temp;
353 inst_mad->U.I.DstReg.WriteMask = RC_MASK_XYZ;
354 inst_mad->U.I.SrcReg[0].File = RC_FILE_TEMPORARY;
355 inst_mad->U.I.SrcReg[0].Index = temp;
356 inst_mad->U.I.SrcReg[0].Swizzle = RC_SWIZZLE_XYZ0;
357 inst_mad->U.I.SrcReg[1].File = RC_FILE_CONSTANT;
358 inst_mad->U.I.SrcReg[1].Index = two;
359 inst_mad->U.I.SrcReg[1].Swizzle = two_swizzle;
360 inst_mad->U.I.SrcReg[2].Swizzle = RC_SWIZZLE_1111;
361 inst_mad->U.I.SrcReg[2].Negate = RC_MASK_XYZ;
362
363 inst_add = rc_insert_new_instruction(c, inst->Prev);
364
365 inst_add->U.I.Opcode = RC_OPCODE_ADD;
366 inst_add->U.I.DstReg.File = RC_FILE_TEMPORARY;
367 inst_add->U.I.DstReg.Index = temp;
368 inst_add->U.I.DstReg.WriteMask = RC_MASK_XYZ;
369 inst_add->U.I.SrcReg[0].Swizzle = RC_SWIZZLE_1111;
370 inst_add->U.I.SrcReg[1].File = RC_FILE_TEMPORARY;
371 inst_add->U.I.SrcReg[1].Index = temp;
372 inst_add->U.I.SrcReg[1].Swizzle = RC_SWIZZLE_XYZ0;
373 inst_add->U.I.SrcReg[1].Abs = 1;
374 inst_add->U.I.SrcReg[1].Negate = RC_MASK_XYZ;
375 } else if (wrapmode == RC_WRAP_MIRRORED_CLAMP) {
376 /*
377 * Mirrored clamp modes are bloody simple, we just use abs
378 * to mirror [0, 1] into [-1, 0]. This works for
379 * all modes i.e. CLAMP, CLAMP_TO_EDGE, and CLAMP_TO_BORDER.
380 */
381 struct rc_instruction *inst_mov;
382
383 inst_mov = rc_insert_new_instruction(c, inst->Prev);
384
385 inst_mov->U.I.Opcode = RC_OPCODE_MOV;
386 inst_mov->U.I.DstReg.File = RC_FILE_TEMPORARY;
387 inst_mov->U.I.DstReg.Index = temp;
388 inst_mov->U.I.DstReg.WriteMask = RC_MASK_XYZ;
389 inst_mov->U.I.SrcReg[0] = inst->U.I.SrcReg[0];
390 inst_mov->U.I.SrcReg[0].Abs = 1;
391 }
392
393 /* Preserve W for TXP/TXB. */
394 inst_mov = rc_insert_new_instruction(c, inst->Prev);
395
396 inst_mov->U.I.Opcode = RC_OPCODE_MOV;
397 inst_mov->U.I.DstReg.File = RC_FILE_TEMPORARY;
398 inst_mov->U.I.DstReg.Index = temp;
399 inst_mov->U.I.DstReg.WriteMask = RC_MASK_W;
400 inst_mov->U.I.SrcReg[0] = inst->U.I.SrcReg[0];
401
402 reset_srcreg(&inst->U.I.SrcReg[0]);
403 inst->U.I.SrcReg[0].File = RC_FILE_TEMPORARY;
404 inst->U.I.SrcReg[0].Index = temp;
405 }
406
407 /* NPOT -> POT conversion for 3D textures. */
408 if (inst->U.I.Opcode != RC_OPCODE_KIL &&
409 compiler->state.unit[inst->U.I.TexSrcUnit].clamp_and_scale_before_fetch) {
410 struct rc_instruction *inst_mov;
411 unsigned temp = rc_find_free_temporary(c);
412
413 /* Saturate XYZ. */
414 inst_mov = rc_insert_new_instruction(c, inst->Prev);
415 inst_mov->U.I.Opcode = RC_OPCODE_MOV;
416 inst_mov->U.I.SaturateMode = RC_SATURATE_ZERO_ONE;
417 inst_mov->U.I.DstReg.File = RC_FILE_TEMPORARY;
418 inst_mov->U.I.DstReg.Index = temp;
419 inst_mov->U.I.DstReg.WriteMask = RC_MASK_XYZ;
420 inst_mov->U.I.SrcReg[0] = inst->U.I.SrcReg[0];
421
422 /* Copy W. */
423 inst_mov = rc_insert_new_instruction(c, inst->Prev);
424 inst_mov->U.I.Opcode = RC_OPCODE_MOV;
425 inst_mov->U.I.DstReg.File = RC_FILE_TEMPORARY;
426 inst_mov->U.I.DstReg.Index = temp;
427 inst_mov->U.I.DstReg.WriteMask = RC_MASK_W;
428 inst_mov->U.I.SrcReg[0] = inst->U.I.SrcReg[0];
429
430 reset_srcreg(&inst->U.I.SrcReg[0]);
431 inst->U.I.SrcReg[0].File = RC_FILE_TEMPORARY;
432 inst->U.I.SrcReg[0].Index = temp;
433
434 scale_texcoords(compiler, inst, RC_STATE_R300_TEXSCALE_FACTOR);
435 }
436
437 /* Convert SNORM-encoded ATI1N sampled as UNORM to SNORM.
438 * Formula: dst = tex > 0.5 ? tex*2-2 : tex*2
439 */
440 if (inst->U.I.Opcode != RC_OPCODE_KIL &&
441 compiler->state.unit[inst->U.I.TexSrcUnit].convert_unorm_to_snorm) {
442 unsigned two, two_swizzle;
443 struct rc_instruction *inst_mul, *inst_mad, *inst_cnd;
444
445 two = rc_constants_add_immediate_scalar(&c->Program.Constants, 2.35, &two_swizzle);
446
447 inst_mul = rc_insert_new_instruction(c, inst);
448 inst_mul->U.I.Opcode = RC_OPCODE_MUL;
449 inst_mul->U.I.DstReg.File = RC_FILE_TEMPORARY;
450 inst_mul->U.I.DstReg.Index = rc_find_free_temporary(c);
451 inst_mul->U.I.SrcReg[0].File = RC_FILE_TEMPORARY;
452 inst_mul->U.I.SrcReg[0].Index = rc_find_free_temporary(c); /* redirected TEX output */
453 inst_mul->U.I.SrcReg[1].File = RC_FILE_CONSTANT; /* 2 */
454 inst_mul->U.I.SrcReg[1].Index = two;
455 inst_mul->U.I.SrcReg[1].Swizzle = two_swizzle;
456
457 inst_mad = rc_insert_new_instruction(c, inst_mul);
458 inst_mad->U.I.Opcode = RC_OPCODE_MAD;
459 inst_mad->U.I.DstReg.File = RC_FILE_TEMPORARY;
460 inst_mad->U.I.DstReg.Index = rc_find_free_temporary(c);
461 inst_mad->U.I.SrcReg[0] = inst_mul->U.I.SrcReg[0]; /* redirected TEX output */
462 inst_mad->U.I.SrcReg[1] = inst_mul->U.I.SrcReg[1]; /* 2 */
463 inst_mad->U.I.SrcReg[2] = inst_mul->U.I.SrcReg[1]; /* 2 */
464 inst_mad->U.I.SrcReg[2].Negate = RC_MASK_XYZW;
465
466 inst_cnd = rc_insert_new_instruction(c, inst_mad);
467 inst_cnd->U.I.Opcode = RC_OPCODE_CND;
468 inst_cnd->U.I.SaturateMode = inst->U.I.SaturateMode;
469 inst_cnd->U.I.DstReg = inst->U.I.DstReg;
470 inst_cnd->U.I.SrcReg[0].File = RC_FILE_TEMPORARY;
471 inst_cnd->U.I.SrcReg[0].Index = inst_mad->U.I.DstReg.Index;
472 inst_cnd->U.I.SrcReg[0].Swizzle = compiler->state.unit[inst->U.I.TexSrcUnit].texture_swizzle;
473 inst_cnd->U.I.SrcReg[1].File = RC_FILE_TEMPORARY;
474 inst_cnd->U.I.SrcReg[1].Index = inst_mul->U.I.DstReg.Index;
475 inst_cnd->U.I.SrcReg[1].Swizzle = compiler->state.unit[inst->U.I.TexSrcUnit].texture_swizzle;
476 inst_cnd->U.I.SrcReg[2] = inst_mul->U.I.SrcReg[0]; /* redirected TEX output */
477
478 inst->U.I.SaturateMode = 0;
479 inst->U.I.DstReg.File = RC_FILE_TEMPORARY;
480 inst->U.I.DstReg.Index = inst_mul->U.I.SrcReg[0].Index;
481 inst->U.I.DstReg.WriteMask = RC_MASK_XYZW;
482 }
483
484 /* Cannot write texture to output registers or with saturate (all chips),
485 * or with masks (non-r500). */
486 if (inst->U.I.Opcode != RC_OPCODE_KIL &&
487 (inst->U.I.DstReg.File != RC_FILE_TEMPORARY ||
488 inst->U.I.SaturateMode ||
489 (!c->is_r500 && inst->U.I.DstReg.WriteMask != RC_MASK_XYZW))) {
490 struct rc_instruction * inst_mov = rc_insert_new_instruction(c, inst);
491
492 inst_mov->U.I.Opcode = RC_OPCODE_MOV;
493 inst_mov->U.I.SaturateMode = inst->U.I.SaturateMode;
494 inst_mov->U.I.DstReg = inst->U.I.DstReg;
495 inst_mov->U.I.SrcReg[0].File = RC_FILE_TEMPORARY;
496 inst_mov->U.I.SrcReg[0].Index = rc_find_free_temporary(c);
497
498 inst->U.I.SaturateMode = 0;
499 inst->U.I.DstReg.File = RC_FILE_TEMPORARY;
500 inst->U.I.DstReg.Index = inst_mov->U.I.SrcReg[0].Index;
501 inst->U.I.DstReg.WriteMask = RC_MASK_XYZW;
502 }
503
504 /* Cannot read texture coordinate from constants file */
505 if (inst->U.I.SrcReg[0].File != RC_FILE_TEMPORARY && inst->U.I.SrcReg[0].File != RC_FILE_INPUT) {
506 struct rc_instruction * inst_mov = rc_insert_new_instruction(c, inst->Prev);
507
508 inst_mov->U.I.Opcode = RC_OPCODE_MOV;
509 inst_mov->U.I.DstReg.File = RC_FILE_TEMPORARY;
510 inst_mov->U.I.DstReg.Index = rc_find_free_temporary(c);
511 inst_mov->U.I.SrcReg[0] = inst->U.I.SrcReg[0];
512
513 reset_srcreg(&inst->U.I.SrcReg[0]);
514 inst->U.I.SrcReg[0].File = RC_FILE_TEMPORARY;
515 inst->U.I.SrcReg[0].Index = inst_mov->U.I.DstReg.Index;
516 }
517
518 return 1;
519 }
520