1 /**************************************************************************
2 *
3 * Copyright 2008 VMware, Inc.
4 * All Rights Reserved.
5 * Copyright 2008 VMware, Inc. All rights Reserved.
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining a
8 * copy of this software and associated documentation files (the
9 * "Software"), to deal in the Software without restriction, including
10 * without limitation the rights to use, copy, modify, merge, publish,
11 * distribute, sub license, and/or sell copies of the Software, and to
12 * permit persons to whom the Software is furnished to do so, subject to
13 * the following conditions:
14 *
15 * The above copyright notice and this permission notice (including the
16 * next paragraph) shall be included in all copies or substantial portions
17 * of the Software.
18 *
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
20 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
21 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
22 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
23 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
24 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
25 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 *
27 **************************************************************************/
28
29 /**
30 * TGSI program scan utility.
31 * Used to determine which registers and instructions are used by a shader.
32 *
33 * Authors: Brian Paul
34 */
35
36
37 #include "util/u_debug.h"
38 #include "util/u_math.h"
39 #include "util/u_memory.h"
40 #include "util/u_prim.h"
41 #include "tgsi/tgsi_info.h"
42 #include "tgsi/tgsi_parse.h"
43 #include "tgsi/tgsi_util.h"
44 #include "tgsi/tgsi_scan.h"
45
46
47 static bool
is_memory_file(unsigned file)48 is_memory_file(unsigned file)
49 {
50 return file == TGSI_FILE_SAMPLER ||
51 file == TGSI_FILE_SAMPLER_VIEW ||
52 file == TGSI_FILE_IMAGE ||
53 file == TGSI_FILE_BUFFER;
54 }
55
56
57 static bool
is_mem_query_inst(unsigned opcode)58 is_mem_query_inst(unsigned opcode)
59 {
60 return opcode == TGSI_OPCODE_RESQ ||
61 opcode == TGSI_OPCODE_TXQ ||
62 opcode == TGSI_OPCODE_TXQS ||
63 opcode == TGSI_OPCODE_LODQ;
64 }
65
66 /**
67 * Is the opcode a "true" texture instruction which samples from a
68 * texture map?
69 */
70 static bool
is_texture_inst(unsigned opcode)71 is_texture_inst(unsigned opcode)
72 {
73 return (!is_mem_query_inst(opcode) &&
74 tgsi_get_opcode_info(opcode)->is_tex);
75 }
76
77
78 /**
79 * Is the opcode an instruction which computes a derivative explicitly or
80 * implicitly?
81 */
82 static bool
computes_derivative(unsigned opcode)83 computes_derivative(unsigned opcode)
84 {
85 if (tgsi_get_opcode_info(opcode)->is_tex) {
86 return opcode != TGSI_OPCODE_TG4 &&
87 opcode != TGSI_OPCODE_TXD &&
88 opcode != TGSI_OPCODE_TXF &&
89 opcode != TGSI_OPCODE_TXF_LZ &&
90 opcode != TGSI_OPCODE_TEX_LZ &&
91 opcode != TGSI_OPCODE_TXL &&
92 opcode != TGSI_OPCODE_TXL2 &&
93 opcode != TGSI_OPCODE_TXQ &&
94 opcode != TGSI_OPCODE_TXQS;
95 }
96
97 return opcode == TGSI_OPCODE_DDX || opcode == TGSI_OPCODE_DDX_FINE ||
98 opcode == TGSI_OPCODE_DDY || opcode == TGSI_OPCODE_DDY_FINE ||
99 opcode == TGSI_OPCODE_SAMPLE ||
100 opcode == TGSI_OPCODE_SAMPLE_B ||
101 opcode == TGSI_OPCODE_SAMPLE_C;
102 }
103
104
105 static void
scan_src_operand(struct tgsi_shader_info * info,const struct tgsi_full_instruction * fullinst,const struct tgsi_full_src_register * src,unsigned src_index,unsigned usage_mask_after_swizzle,bool is_interp_instruction,bool * is_mem_inst)106 scan_src_operand(struct tgsi_shader_info *info,
107 const struct tgsi_full_instruction *fullinst,
108 const struct tgsi_full_src_register *src,
109 unsigned src_index,
110 unsigned usage_mask_after_swizzle,
111 bool is_interp_instruction,
112 bool *is_mem_inst)
113 {
114 int ind = src->Register.Index;
115
116 if (info->processor == PIPE_SHADER_COMPUTE &&
117 src->Register.File == TGSI_FILE_SYSTEM_VALUE) {
118 unsigned name, mask;
119
120 name = info->system_value_semantic_name[src->Register.Index];
121
122 switch (name) {
123 case TGSI_SEMANTIC_THREAD_ID:
124 case TGSI_SEMANTIC_BLOCK_ID:
125 mask = usage_mask_after_swizzle & TGSI_WRITEMASK_XYZ;
126 while (mask) {
127 unsigned i = u_bit_scan(&mask);
128
129 if (name == TGSI_SEMANTIC_THREAD_ID)
130 info->uses_thread_id[i] = true;
131 else
132 info->uses_block_id[i] = true;
133 }
134 break;
135 case TGSI_SEMANTIC_BLOCK_SIZE:
136 /* The block size is translated to IMM with a fixed block size. */
137 if (info->properties[TGSI_PROPERTY_CS_FIXED_BLOCK_WIDTH] == 0)
138 info->uses_block_size = true;
139 break;
140 case TGSI_SEMANTIC_GRID_SIZE:
141 info->uses_grid_size = true;
142 break;
143 }
144 }
145
146 /* Mark which inputs are effectively used */
147 if (src->Register.File == TGSI_FILE_INPUT) {
148 if (src->Register.Indirect) {
149 for (ind = 0; ind < info->num_inputs; ++ind) {
150 info->input_usage_mask[ind] |= usage_mask_after_swizzle;
151 }
152 } else {
153 assert(ind >= 0);
154 assert(ind < PIPE_MAX_SHADER_INPUTS);
155 info->input_usage_mask[ind] |= usage_mask_after_swizzle;
156 }
157
158 if (info->processor == PIPE_SHADER_FRAGMENT) {
159 unsigned name, index, input;
160
161 if (src->Register.Indirect && src->Indirect.ArrayID)
162 input = info->input_array_first[src->Indirect.ArrayID];
163 else
164 input = src->Register.Index;
165
166 name = info->input_semantic_name[input];
167 index = info->input_semantic_index[input];
168
169 if (name == TGSI_SEMANTIC_POSITION &&
170 usage_mask_after_swizzle & TGSI_WRITEMASK_Z)
171 info->reads_z = true;
172
173 if (name == TGSI_SEMANTIC_COLOR)
174 info->colors_read |= usage_mask_after_swizzle << (index * 4);
175
176 /* Process only interpolated varyings. Don't include POSITION.
177 * Don't include integer varyings, because they are not
178 * interpolated. Don't process inputs interpolated by INTERP
179 * opcodes. Those are tracked separately.
180 */
181 if ((!is_interp_instruction || src_index != 0) &&
182 (name == TGSI_SEMANTIC_GENERIC ||
183 name == TGSI_SEMANTIC_TEXCOORD ||
184 name == TGSI_SEMANTIC_COLOR ||
185 name == TGSI_SEMANTIC_BCOLOR ||
186 name == TGSI_SEMANTIC_FOG ||
187 name == TGSI_SEMANTIC_CLIPDIST)) {
188 switch (info->input_interpolate[input]) {
189 case TGSI_INTERPOLATE_COLOR:
190 case TGSI_INTERPOLATE_PERSPECTIVE:
191 switch (info->input_interpolate_loc[input]) {
192 case TGSI_INTERPOLATE_LOC_CENTER:
193 info->uses_persp_center = TRUE;
194 break;
195 case TGSI_INTERPOLATE_LOC_CENTROID:
196 info->uses_persp_centroid = TRUE;
197 break;
198 case TGSI_INTERPOLATE_LOC_SAMPLE:
199 info->uses_persp_sample = TRUE;
200 break;
201 }
202 break;
203 case TGSI_INTERPOLATE_LINEAR:
204 switch (info->input_interpolate_loc[input]) {
205 case TGSI_INTERPOLATE_LOC_CENTER:
206 info->uses_linear_center = TRUE;
207 break;
208 case TGSI_INTERPOLATE_LOC_CENTROID:
209 info->uses_linear_centroid = TRUE;
210 break;
211 case TGSI_INTERPOLATE_LOC_SAMPLE:
212 info->uses_linear_sample = TRUE;
213 break;
214 }
215 break;
216 /* TGSI_INTERPOLATE_CONSTANT doesn't do any interpolation. */
217 }
218 }
219 }
220 }
221
222 if (info->processor == PIPE_SHADER_TESS_CTRL &&
223 src->Register.File == TGSI_FILE_OUTPUT) {
224 unsigned input;
225
226 if (src->Register.Indirect && src->Indirect.ArrayID)
227 input = info->output_array_first[src->Indirect.ArrayID];
228 else
229 input = src->Register.Index;
230
231 switch (info->output_semantic_name[input]) {
232 case TGSI_SEMANTIC_PATCH:
233 info->reads_perpatch_outputs = true;
234 break;
235 case TGSI_SEMANTIC_TESSINNER:
236 case TGSI_SEMANTIC_TESSOUTER:
237 info->reads_tessfactor_outputs = true;
238 break;
239 default:
240 info->reads_pervertex_outputs = true;
241 }
242 }
243
244 /* check for indirect register reads */
245 if (src->Register.Indirect) {
246 info->indirect_files |= (1 << src->Register.File);
247 info->indirect_files_read |= (1 << src->Register.File);
248
249 /* record indirect constant buffer indexing */
250 if (src->Register.File == TGSI_FILE_CONSTANT) {
251 if (src->Register.Dimension) {
252 if (src->Dimension.Indirect)
253 info->const_buffers_indirect = info->const_buffers_declared;
254 else
255 info->const_buffers_indirect |= 1u << src->Dimension.Index;
256 } else {
257 info->const_buffers_indirect |= 1;
258 }
259 }
260 }
261
262 if (src->Register.Dimension && src->Dimension.Indirect)
263 info->dim_indirect_files |= 1u << src->Register.File;
264
265 /* Texture samplers */
266 if (src->Register.File == TGSI_FILE_SAMPLER) {
267 const unsigned index = src->Register.Index;
268
269 assert(fullinst->Instruction.Texture);
270 assert(index < ARRAY_SIZE(info->is_msaa_sampler));
271 assert(index < PIPE_MAX_SAMPLERS);
272
273 if (is_texture_inst(fullinst->Instruction.Opcode)) {
274 const unsigned target = fullinst->Texture.Texture;
275 assert(target < TGSI_TEXTURE_UNKNOWN);
276 /* for texture instructions, check that the texture instruction
277 * target matches the previous sampler view declaration (if there
278 * was one.)
279 */
280 if (info->sampler_targets[index] == TGSI_TEXTURE_UNKNOWN) {
281 /* probably no sampler view declaration */
282 info->sampler_targets[index] = target;
283 } else {
284 /* Make sure the texture instruction's sampler/target info
285 * agrees with the sampler view declaration.
286 */
287 assert(info->sampler_targets[index] == target);
288 }
289 /* MSAA samplers */
290 if (target == TGSI_TEXTURE_2D_MSAA ||
291 target == TGSI_TEXTURE_2D_ARRAY_MSAA) {
292 info->is_msaa_sampler[src->Register.Index] = TRUE;
293 }
294 }
295 }
296
297 if (is_memory_file(src->Register.File) &&
298 !is_mem_query_inst(fullinst->Instruction.Opcode)) {
299 *is_mem_inst = true;
300
301 if (tgsi_get_opcode_info(fullinst->Instruction.Opcode)->is_store) {
302 info->writes_memory = TRUE;
303
304 if (src->Register.File == TGSI_FILE_IMAGE) {
305 if (src->Register.Indirect)
306 info->images_atomic = info->images_declared;
307 else
308 info->images_atomic |= 1 << src->Register.Index;
309 } else if (src->Register.File == TGSI_FILE_BUFFER) {
310 if (src->Register.Indirect)
311 info->shader_buffers_atomic = info->shader_buffers_declared;
312 else
313 info->shader_buffers_atomic |= 1 << src->Register.Index;
314 }
315 } else {
316 if (src->Register.File == TGSI_FILE_IMAGE) {
317 if (src->Register.Indirect)
318 info->images_load = info->images_declared;
319 else
320 info->images_load |= 1 << src->Register.Index;
321 } else if (src->Register.File == TGSI_FILE_BUFFER) {
322 if (src->Register.Indirect)
323 info->shader_buffers_load = info->shader_buffers_declared;
324 else
325 info->shader_buffers_load |= 1 << src->Register.Index;
326 }
327 }
328 }
329 }
330
331
332 static void
scan_instruction(struct tgsi_shader_info * info,const struct tgsi_full_instruction * fullinst,unsigned * current_depth)333 scan_instruction(struct tgsi_shader_info *info,
334 const struct tgsi_full_instruction *fullinst,
335 unsigned *current_depth)
336 {
337 unsigned i;
338 bool is_mem_inst = false;
339 bool is_interp_instruction = false;
340 unsigned sampler_src;
341
342 assert(fullinst->Instruction.Opcode < TGSI_OPCODE_LAST);
343 info->opcode_count[fullinst->Instruction.Opcode]++;
344
345 switch (fullinst->Instruction.Opcode) {
346 case TGSI_OPCODE_IF:
347 case TGSI_OPCODE_UIF:
348 case TGSI_OPCODE_BGNLOOP:
349 (*current_depth)++;
350 info->max_depth = MAX2(info->max_depth, *current_depth);
351 break;
352 case TGSI_OPCODE_ENDIF:
353 case TGSI_OPCODE_ENDLOOP:
354 (*current_depth)--;
355 break;
356 case TGSI_OPCODE_TEX:
357 case TGSI_OPCODE_TEX_LZ:
358 case TGSI_OPCODE_TXB:
359 case TGSI_OPCODE_TXD:
360 case TGSI_OPCODE_TXL:
361 case TGSI_OPCODE_TXP:
362 case TGSI_OPCODE_TXQ:
363 case TGSI_OPCODE_TXQS:
364 case TGSI_OPCODE_TXF:
365 case TGSI_OPCODE_TXF_LZ:
366 case TGSI_OPCODE_TEX2:
367 case TGSI_OPCODE_TXB2:
368 case TGSI_OPCODE_TXL2:
369 case TGSI_OPCODE_TG4:
370 case TGSI_OPCODE_LODQ:
371 sampler_src = fullinst->Instruction.NumSrcRegs - 1;
372 if (fullinst->Src[sampler_src].Register.File != TGSI_FILE_SAMPLER)
373 info->uses_bindless_samplers = true;
374 break;
375 case TGSI_OPCODE_RESQ:
376 case TGSI_OPCODE_LOAD:
377 case TGSI_OPCODE_ATOMUADD:
378 case TGSI_OPCODE_ATOMXCHG:
379 case TGSI_OPCODE_ATOMCAS:
380 case TGSI_OPCODE_ATOMAND:
381 case TGSI_OPCODE_ATOMOR:
382 case TGSI_OPCODE_ATOMXOR:
383 case TGSI_OPCODE_ATOMUMIN:
384 case TGSI_OPCODE_ATOMUMAX:
385 case TGSI_OPCODE_ATOMIMIN:
386 case TGSI_OPCODE_ATOMIMAX:
387 if (tgsi_is_bindless_image_file(fullinst->Src[0].Register.File))
388 info->uses_bindless_images = true;
389 break;
390 case TGSI_OPCODE_STORE:
391 if (tgsi_is_bindless_image_file(fullinst->Dst[0].Register.File))
392 info->uses_bindless_images = true;
393 break;
394 default:
395 break;
396 }
397
398 if (fullinst->Instruction.Opcode == TGSI_OPCODE_INTERP_CENTROID ||
399 fullinst->Instruction.Opcode == TGSI_OPCODE_INTERP_OFFSET ||
400 fullinst->Instruction.Opcode == TGSI_OPCODE_INTERP_SAMPLE) {
401 const struct tgsi_full_src_register *src0 = &fullinst->Src[0];
402 unsigned input;
403
404 is_interp_instruction = true;
405
406 if (src0->Register.Indirect && src0->Indirect.ArrayID)
407 input = info->input_array_first[src0->Indirect.ArrayID];
408 else
409 input = src0->Register.Index;
410
411 /* For the INTERP opcodes, the interpolation is always
412 * PERSPECTIVE unless LINEAR is specified.
413 */
414 switch (info->input_interpolate[input]) {
415 case TGSI_INTERPOLATE_COLOR:
416 case TGSI_INTERPOLATE_CONSTANT:
417 case TGSI_INTERPOLATE_PERSPECTIVE:
418 switch (fullinst->Instruction.Opcode) {
419 case TGSI_OPCODE_INTERP_CENTROID:
420 info->uses_persp_opcode_interp_centroid = TRUE;
421 break;
422 case TGSI_OPCODE_INTERP_OFFSET:
423 info->uses_persp_opcode_interp_offset = TRUE;
424 break;
425 case TGSI_OPCODE_INTERP_SAMPLE:
426 info->uses_persp_opcode_interp_sample = TRUE;
427 break;
428 }
429 break;
430
431 case TGSI_INTERPOLATE_LINEAR:
432 switch (fullinst->Instruction.Opcode) {
433 case TGSI_OPCODE_INTERP_CENTROID:
434 info->uses_linear_opcode_interp_centroid = TRUE;
435 break;
436 case TGSI_OPCODE_INTERP_OFFSET:
437 info->uses_linear_opcode_interp_offset = TRUE;
438 break;
439 case TGSI_OPCODE_INTERP_SAMPLE:
440 info->uses_linear_opcode_interp_sample = TRUE;
441 break;
442 }
443 break;
444 }
445 }
446
447 if ((fullinst->Instruction.Opcode >= TGSI_OPCODE_F2D &&
448 fullinst->Instruction.Opcode <= TGSI_OPCODE_DSSG) ||
449 fullinst->Instruction.Opcode == TGSI_OPCODE_DFMA ||
450 fullinst->Instruction.Opcode == TGSI_OPCODE_DDIV ||
451 fullinst->Instruction.Opcode == TGSI_OPCODE_D2U64 ||
452 fullinst->Instruction.Opcode == TGSI_OPCODE_D2I64 ||
453 fullinst->Instruction.Opcode == TGSI_OPCODE_U642D ||
454 fullinst->Instruction.Opcode == TGSI_OPCODE_I642D)
455 info->uses_doubles = TRUE;
456
457 for (i = 0; i < fullinst->Instruction.NumSrcRegs; i++) {
458 scan_src_operand(info, fullinst, &fullinst->Src[i], i,
459 tgsi_util_get_inst_usage_mask(fullinst, i),
460 is_interp_instruction, &is_mem_inst);
461
462 if (fullinst->Src[i].Register.Indirect) {
463 struct tgsi_full_src_register src = {{0}};
464
465 src.Register.File = fullinst->Src[i].Indirect.File;
466 src.Register.Index = fullinst->Src[i].Indirect.Index;
467
468 scan_src_operand(info, fullinst, &src, -1,
469 1 << fullinst->Src[i].Indirect.Swizzle,
470 false, NULL);
471 }
472
473 if (fullinst->Src[i].Register.Dimension &&
474 fullinst->Src[i].Dimension.Indirect) {
475 struct tgsi_full_src_register src = {{0}};
476
477 src.Register.File = fullinst->Src[i].DimIndirect.File;
478 src.Register.Index = fullinst->Src[i].DimIndirect.Index;
479
480 scan_src_operand(info, fullinst, &src, -1,
481 1 << fullinst->Src[i].DimIndirect.Swizzle,
482 false, NULL);
483 }
484 }
485
486 if (fullinst->Instruction.Texture) {
487 for (i = 0; i < fullinst->Texture.NumOffsets; i++) {
488 struct tgsi_full_src_register src = {{0}};
489
490 src.Register.File = fullinst->TexOffsets[i].File;
491 src.Register.Index = fullinst->TexOffsets[i].Index;
492
493 /* The usage mask is suboptimal but should be safe. */
494 scan_src_operand(info, fullinst, &src, -1,
495 (1 << fullinst->TexOffsets[i].SwizzleX) |
496 (1 << fullinst->TexOffsets[i].SwizzleY) |
497 (1 << fullinst->TexOffsets[i].SwizzleZ),
498 false, &is_mem_inst);
499 }
500 }
501
502 /* check for indirect register writes */
503 for (i = 0; i < fullinst->Instruction.NumDstRegs; i++) {
504 const struct tgsi_full_dst_register *dst = &fullinst->Dst[i];
505
506 if (dst->Register.Indirect) {
507 struct tgsi_full_src_register src = {{0}};
508
509 src.Register.File = dst->Indirect.File;
510 src.Register.Index = dst->Indirect.Index;
511
512 scan_src_operand(info, fullinst, &src, -1,
513 1 << dst->Indirect.Swizzle, false, NULL);
514
515 info->indirect_files |= (1 << dst->Register.File);
516 info->indirect_files_written |= (1 << dst->Register.File);
517 }
518
519 if (dst->Register.Dimension && dst->Dimension.Indirect) {
520 struct tgsi_full_src_register src = {{0}};
521
522 src.Register.File = dst->DimIndirect.File;
523 src.Register.Index = dst->DimIndirect.Index;
524
525 scan_src_operand(info, fullinst, &src, -1,
526 1 << dst->DimIndirect.Swizzle, false, NULL);
527
528 info->dim_indirect_files |= 1u << dst->Register.File;
529 }
530
531 if (is_memory_file(dst->Register.File)) {
532 assert(fullinst->Instruction.Opcode == TGSI_OPCODE_STORE);
533
534 is_mem_inst = true;
535 info->writes_memory = TRUE;
536
537 if (dst->Register.File == TGSI_FILE_IMAGE) {
538 if (dst->Register.Indirect)
539 info->images_store = info->images_declared;
540 else
541 info->images_store |= 1 << dst->Register.Index;
542 } else if (dst->Register.File == TGSI_FILE_BUFFER) {
543 if (dst->Register.Indirect)
544 info->shader_buffers_store = info->shader_buffers_declared;
545 else
546 info->shader_buffers_store |= 1 << dst->Register.Index;
547 }
548 }
549 }
550
551 if (is_mem_inst)
552 info->num_memory_instructions++;
553
554 if (computes_derivative(fullinst->Instruction.Opcode))
555 info->uses_derivatives = true;
556
557 info->num_instructions++;
558 }
559
560
561 static void
scan_declaration(struct tgsi_shader_info * info,const struct tgsi_full_declaration * fulldecl)562 scan_declaration(struct tgsi_shader_info *info,
563 const struct tgsi_full_declaration *fulldecl)
564 {
565 const uint file = fulldecl->Declaration.File;
566 const unsigned procType = info->processor;
567 uint reg;
568
569 if (fulldecl->Declaration.Array) {
570 unsigned array_id = fulldecl->Array.ArrayID;
571
572 switch (file) {
573 case TGSI_FILE_INPUT:
574 assert(array_id < ARRAY_SIZE(info->input_array_first));
575 info->input_array_first[array_id] = fulldecl->Range.First;
576 info->input_array_last[array_id] = fulldecl->Range.Last;
577 break;
578 case TGSI_FILE_OUTPUT:
579 assert(array_id < ARRAY_SIZE(info->output_array_first));
580 info->output_array_first[array_id] = fulldecl->Range.First;
581 info->output_array_last[array_id] = fulldecl->Range.Last;
582 break;
583 }
584 info->array_max[file] = MAX2(info->array_max[file], array_id);
585 }
586
587 for (reg = fulldecl->Range.First; reg <= fulldecl->Range.Last; reg++) {
588 unsigned semName = fulldecl->Semantic.Name;
589 unsigned semIndex = fulldecl->Semantic.Index +
590 (reg - fulldecl->Range.First);
591 int buffer;
592 unsigned index, target, type;
593
594 /* only first 32 regs will appear in this bitfield */
595 info->file_mask[file] |= (1 << reg);
596 info->file_count[file]++;
597 info->file_max[file] = MAX2(info->file_max[file], (int)reg);
598
599 switch (file) {
600 case TGSI_FILE_CONSTANT:
601 buffer = 0;
602
603 if (fulldecl->Declaration.Dimension)
604 buffer = fulldecl->Dim.Index2D;
605
606 info->const_file_max[buffer] =
607 MAX2(info->const_file_max[buffer], (int)reg);
608 info->const_buffers_declared |= 1u << buffer;
609 break;
610
611 case TGSI_FILE_IMAGE:
612 info->images_declared |= 1u << reg;
613 if (fulldecl->Image.Resource == TGSI_TEXTURE_BUFFER)
614 info->images_buffers |= 1 << reg;
615 break;
616
617 case TGSI_FILE_BUFFER:
618 info->shader_buffers_declared |= 1u << reg;
619 break;
620
621 case TGSI_FILE_INPUT:
622 info->input_semantic_name[reg] = (ubyte) semName;
623 info->input_semantic_index[reg] = (ubyte) semIndex;
624 info->input_interpolate[reg] = (ubyte)fulldecl->Interp.Interpolate;
625 info->input_interpolate_loc[reg] = (ubyte)fulldecl->Interp.Location;
626 info->input_cylindrical_wrap[reg] = (ubyte)fulldecl->Interp.CylindricalWrap;
627
628 /* Vertex shaders can have inputs with holes between them. */
629 info->num_inputs = MAX2(info->num_inputs, reg + 1);
630
631 switch (semName) {
632 case TGSI_SEMANTIC_PRIMID:
633 info->uses_primid = true;
634 break;
635 case TGSI_SEMANTIC_POSITION:
636 info->reads_position = true;
637 break;
638 case TGSI_SEMANTIC_FACE:
639 info->uses_frontface = true;
640 break;
641 }
642 break;
643
644 case TGSI_FILE_SYSTEM_VALUE:
645 index = fulldecl->Range.First;
646
647 info->system_value_semantic_name[index] = semName;
648 info->num_system_values = MAX2(info->num_system_values, index + 1);
649
650 switch (semName) {
651 case TGSI_SEMANTIC_INSTANCEID:
652 info->uses_instanceid = TRUE;
653 break;
654 case TGSI_SEMANTIC_VERTEXID:
655 info->uses_vertexid = TRUE;
656 break;
657 case TGSI_SEMANTIC_VERTEXID_NOBASE:
658 info->uses_vertexid_nobase = TRUE;
659 break;
660 case TGSI_SEMANTIC_BASEVERTEX:
661 info->uses_basevertex = TRUE;
662 break;
663 case TGSI_SEMANTIC_PRIMID:
664 info->uses_primid = TRUE;
665 break;
666 case TGSI_SEMANTIC_INVOCATIONID:
667 info->uses_invocationid = TRUE;
668 break;
669 case TGSI_SEMANTIC_POSITION:
670 info->reads_position = TRUE;
671 break;
672 case TGSI_SEMANTIC_FACE:
673 info->uses_frontface = TRUE;
674 break;
675 case TGSI_SEMANTIC_SAMPLEMASK:
676 info->reads_samplemask = TRUE;
677 break;
678 case TGSI_SEMANTIC_TESSINNER:
679 case TGSI_SEMANTIC_TESSOUTER:
680 info->reads_tess_factors = true;
681 break;
682 }
683 break;
684
685 case TGSI_FILE_OUTPUT:
686 info->output_semantic_name[reg] = (ubyte) semName;
687 info->output_semantic_index[reg] = (ubyte) semIndex;
688 info->output_usagemask[reg] |= fulldecl->Declaration.UsageMask;
689 info->num_outputs = MAX2(info->num_outputs, reg + 1);
690
691 if (fulldecl->Declaration.UsageMask & TGSI_WRITEMASK_X) {
692 info->output_streams[reg] |= (ubyte)fulldecl->Semantic.StreamX;
693 info->num_stream_output_components[fulldecl->Semantic.StreamX]++;
694 }
695 if (fulldecl->Declaration.UsageMask & TGSI_WRITEMASK_Y) {
696 info->output_streams[reg] |= (ubyte)fulldecl->Semantic.StreamY << 2;
697 info->num_stream_output_components[fulldecl->Semantic.StreamY]++;
698 }
699 if (fulldecl->Declaration.UsageMask & TGSI_WRITEMASK_Z) {
700 info->output_streams[reg] |= (ubyte)fulldecl->Semantic.StreamZ << 4;
701 info->num_stream_output_components[fulldecl->Semantic.StreamZ]++;
702 }
703 if (fulldecl->Declaration.UsageMask & TGSI_WRITEMASK_W) {
704 info->output_streams[reg] |= (ubyte)fulldecl->Semantic.StreamW << 6;
705 info->num_stream_output_components[fulldecl->Semantic.StreamW]++;
706 }
707
708 switch (semName) {
709 case TGSI_SEMANTIC_PRIMID:
710 info->writes_primid = true;
711 break;
712 case TGSI_SEMANTIC_VIEWPORT_INDEX:
713 info->writes_viewport_index = true;
714 break;
715 case TGSI_SEMANTIC_LAYER:
716 info->writes_layer = true;
717 break;
718 case TGSI_SEMANTIC_PSIZE:
719 info->writes_psize = true;
720 break;
721 case TGSI_SEMANTIC_CLIPVERTEX:
722 info->writes_clipvertex = true;
723 break;
724 case TGSI_SEMANTIC_COLOR:
725 info->colors_written |= 1 << semIndex;
726 break;
727 case TGSI_SEMANTIC_STENCIL:
728 info->writes_stencil = true;
729 break;
730 case TGSI_SEMANTIC_SAMPLEMASK:
731 info->writes_samplemask = true;
732 break;
733 case TGSI_SEMANTIC_EDGEFLAG:
734 info->writes_edgeflag = true;
735 break;
736 case TGSI_SEMANTIC_POSITION:
737 if (procType == PIPE_SHADER_FRAGMENT)
738 info->writes_z = true;
739 else
740 info->writes_position = true;
741 break;
742 }
743 break;
744
745 case TGSI_FILE_SAMPLER:
746 STATIC_ASSERT(sizeof(info->samplers_declared) * 8 >= PIPE_MAX_SAMPLERS);
747 info->samplers_declared |= 1u << reg;
748 break;
749
750 case TGSI_FILE_SAMPLER_VIEW:
751 target = fulldecl->SamplerView.Resource;
752 type = fulldecl->SamplerView.ReturnTypeX;
753
754 assert(target < TGSI_TEXTURE_UNKNOWN);
755 if (info->sampler_targets[reg] == TGSI_TEXTURE_UNKNOWN) {
756 /* Save sampler target for this sampler index */
757 info->sampler_targets[reg] = target;
758 info->sampler_type[reg] = type;
759 } else {
760 /* if previously declared, make sure targets agree */
761 assert(info->sampler_targets[reg] == target);
762 assert(info->sampler_type[reg] == type);
763 }
764 break;
765 }
766 }
767 }
768
769
770 static void
scan_immediate(struct tgsi_shader_info * info)771 scan_immediate(struct tgsi_shader_info *info)
772 {
773 uint reg = info->immediate_count++;
774 uint file = TGSI_FILE_IMMEDIATE;
775
776 info->file_mask[file] |= (1 << reg);
777 info->file_count[file]++;
778 info->file_max[file] = MAX2(info->file_max[file], (int)reg);
779 }
780
781
782 static void
scan_property(struct tgsi_shader_info * info,const struct tgsi_full_property * fullprop)783 scan_property(struct tgsi_shader_info *info,
784 const struct tgsi_full_property *fullprop)
785 {
786 unsigned name = fullprop->Property.PropertyName;
787 unsigned value = fullprop->u[0].Data;
788
789 assert(name < ARRAY_SIZE(info->properties));
790 info->properties[name] = value;
791
792 switch (name) {
793 case TGSI_PROPERTY_NUM_CLIPDIST_ENABLED:
794 info->num_written_clipdistance = value;
795 info->clipdist_writemask |= (1 << value) - 1;
796 break;
797 case TGSI_PROPERTY_NUM_CULLDIST_ENABLED:
798 info->num_written_culldistance = value;
799 info->culldist_writemask |= (1 << value) - 1;
800 break;
801 }
802 }
803
804
805 /**
806 * Scan the given TGSI shader to collect information such as number of
807 * registers used, special instructions used, etc.
808 * \return info the result of the scan
809 */
810 void
tgsi_scan_shader(const struct tgsi_token * tokens,struct tgsi_shader_info * info)811 tgsi_scan_shader(const struct tgsi_token *tokens,
812 struct tgsi_shader_info *info)
813 {
814 uint procType, i;
815 struct tgsi_parse_context parse;
816 unsigned current_depth = 0;
817
818 memset(info, 0, sizeof(*info));
819 for (i = 0; i < TGSI_FILE_COUNT; i++)
820 info->file_max[i] = -1;
821 for (i = 0; i < ARRAY_SIZE(info->const_file_max); i++)
822 info->const_file_max[i] = -1;
823 info->properties[TGSI_PROPERTY_GS_INVOCATIONS] = 1;
824 for (i = 0; i < ARRAY_SIZE(info->sampler_targets); i++)
825 info->sampler_targets[i] = TGSI_TEXTURE_UNKNOWN;
826
827 /**
828 ** Setup to begin parsing input shader
829 **/
830 if (tgsi_parse_init( &parse, tokens ) != TGSI_PARSE_OK) {
831 debug_printf("tgsi_parse_init() failed in tgsi_scan_shader()!\n");
832 return;
833 }
834 procType = parse.FullHeader.Processor.Processor;
835 assert(procType == PIPE_SHADER_FRAGMENT ||
836 procType == PIPE_SHADER_VERTEX ||
837 procType == PIPE_SHADER_GEOMETRY ||
838 procType == PIPE_SHADER_TESS_CTRL ||
839 procType == PIPE_SHADER_TESS_EVAL ||
840 procType == PIPE_SHADER_COMPUTE);
841 info->processor = procType;
842
843 /**
844 ** Loop over incoming program tokens/instructions
845 */
846 while (!tgsi_parse_end_of_tokens(&parse)) {
847 info->num_tokens++;
848
849 tgsi_parse_token( &parse );
850
851 switch( parse.FullToken.Token.Type ) {
852 case TGSI_TOKEN_TYPE_INSTRUCTION:
853 scan_instruction(info, &parse.FullToken.FullInstruction,
854 ¤t_depth);
855 break;
856 case TGSI_TOKEN_TYPE_DECLARATION:
857 scan_declaration(info, &parse.FullToken.FullDeclaration);
858 break;
859 case TGSI_TOKEN_TYPE_IMMEDIATE:
860 scan_immediate(info);
861 break;
862 case TGSI_TOKEN_TYPE_PROPERTY:
863 scan_property(info, &parse.FullToken.FullProperty);
864 break;
865 default:
866 assert(!"Unexpected TGSI token type");
867 }
868 }
869
870 info->uses_kill = (info->opcode_count[TGSI_OPCODE_KILL_IF] ||
871 info->opcode_count[TGSI_OPCODE_KILL]);
872
873 /* The dimensions of the IN decleration in geometry shader have
874 * to be deduced from the type of the input primitive.
875 */
876 if (procType == PIPE_SHADER_GEOMETRY) {
877 unsigned input_primitive =
878 info->properties[TGSI_PROPERTY_GS_INPUT_PRIM];
879 int num_verts = u_vertices_per_prim(input_primitive);
880 int j;
881 info->file_count[TGSI_FILE_INPUT] = num_verts;
882 info->file_max[TGSI_FILE_INPUT] =
883 MAX2(info->file_max[TGSI_FILE_INPUT], num_verts - 1);
884 for (j = 0; j < num_verts; ++j) {
885 info->file_mask[TGSI_FILE_INPUT] |= (1 << j);
886 }
887 }
888
889 tgsi_parse_free(&parse);
890 }
891
892 /**
893 * Collect information about the arrays of a given register file.
894 *
895 * @param tokens TGSI shader
896 * @param file the register file to scan through
897 * @param max_array_id number of entries in @p arrays; should be equal to the
898 * highest array id, i.e. tgsi_shader_info::array_max[file].
899 * @param arrays info for array of each ID will be written to arrays[ID - 1].
900 */
901 void
tgsi_scan_arrays(const struct tgsi_token * tokens,unsigned file,unsigned max_array_id,struct tgsi_array_info * arrays)902 tgsi_scan_arrays(const struct tgsi_token *tokens,
903 unsigned file,
904 unsigned max_array_id,
905 struct tgsi_array_info *arrays)
906 {
907 struct tgsi_parse_context parse;
908
909 if (tgsi_parse_init(&parse, tokens) != TGSI_PARSE_OK) {
910 debug_printf("tgsi_parse_init() failed in tgsi_scan_arrays()!\n");
911 return;
912 }
913
914 memset(arrays, 0, sizeof(arrays[0]) * max_array_id);
915
916 while (!tgsi_parse_end_of_tokens(&parse)) {
917 struct tgsi_full_instruction *inst;
918
919 tgsi_parse_token(&parse);
920
921 if (parse.FullToken.Token.Type == TGSI_TOKEN_TYPE_DECLARATION) {
922 struct tgsi_full_declaration *decl = &parse.FullToken.FullDeclaration;
923
924 if (decl->Declaration.Array && decl->Declaration.File == file &&
925 decl->Array.ArrayID > 0 && decl->Array.ArrayID <= max_array_id) {
926 struct tgsi_array_info *array = &arrays[decl->Array.ArrayID - 1];
927 assert(!array->declared);
928 array->declared = true;
929 array->range = decl->Range;
930 }
931 }
932
933 if (parse.FullToken.Token.Type != TGSI_TOKEN_TYPE_INSTRUCTION)
934 continue;
935
936 inst = &parse.FullToken.FullInstruction;
937 for (unsigned i = 0; i < inst->Instruction.NumDstRegs; i++) {
938 const struct tgsi_full_dst_register *dst = &inst->Dst[i];
939 if (dst->Register.File != file)
940 continue;
941
942 if (dst->Register.Indirect) {
943 if (dst->Indirect.ArrayID > 0 &&
944 dst->Indirect.ArrayID <= max_array_id) {
945 arrays[dst->Indirect.ArrayID - 1].writemask |= dst->Register.WriteMask;
946 } else {
947 /* Indirect writes without an ArrayID can write anywhere. */
948 for (unsigned j = 0; j < max_array_id; ++j)
949 arrays[j].writemask |= dst->Register.WriteMask;
950 }
951 } else {
952 /* Check whether the write falls into any of the arrays anyway. */
953 for (unsigned j = 0; j < max_array_id; ++j) {
954 struct tgsi_array_info *array = &arrays[j];
955 if (array->declared &&
956 dst->Register.Index >= array->range.First &&
957 dst->Register.Index <= array->range.Last)
958 array->writemask |= dst->Register.WriteMask;
959 }
960 }
961 }
962 }
963
964 tgsi_parse_free(&parse);
965
966 return;
967 }
968
969 static void
check_no_subroutines(const struct tgsi_full_instruction * inst)970 check_no_subroutines(const struct tgsi_full_instruction *inst)
971 {
972 switch (inst->Instruction.Opcode) {
973 case TGSI_OPCODE_BGNSUB:
974 case TGSI_OPCODE_ENDSUB:
975 case TGSI_OPCODE_CAL:
976 unreachable("subroutines unhandled");
977 }
978 }
979
980 static unsigned
get_inst_tessfactor_writemask(const struct tgsi_shader_info * info,const struct tgsi_full_instruction * inst)981 get_inst_tessfactor_writemask(const struct tgsi_shader_info *info,
982 const struct tgsi_full_instruction *inst)
983 {
984 unsigned writemask = 0;
985
986 for (unsigned i = 0; i < inst->Instruction.NumDstRegs; i++) {
987 const struct tgsi_full_dst_register *dst = &inst->Dst[i];
988
989 if (dst->Register.File == TGSI_FILE_OUTPUT &&
990 !dst->Register.Indirect) {
991 unsigned name = info->output_semantic_name[dst->Register.Index];
992
993 if (name == TGSI_SEMANTIC_TESSINNER)
994 writemask |= dst->Register.WriteMask;
995 else if (name == TGSI_SEMANTIC_TESSOUTER)
996 writemask |= dst->Register.WriteMask << 4;
997 }
998 }
999 return writemask;
1000 }
1001
1002 static unsigned
get_block_tessfactor_writemask(const struct tgsi_shader_info * info,struct tgsi_parse_context * parse,unsigned end_opcode)1003 get_block_tessfactor_writemask(const struct tgsi_shader_info *info,
1004 struct tgsi_parse_context *parse,
1005 unsigned end_opcode)
1006 {
1007 struct tgsi_full_instruction *inst;
1008 unsigned writemask = 0;
1009
1010 do {
1011 tgsi_parse_token(parse);
1012 assert(parse->FullToken.Token.Type == TGSI_TOKEN_TYPE_INSTRUCTION);
1013 inst = &parse->FullToken.FullInstruction;
1014 check_no_subroutines(inst);
1015
1016 /* Recursively process nested blocks. */
1017 switch (inst->Instruction.Opcode) {
1018 case TGSI_OPCODE_IF:
1019 case TGSI_OPCODE_UIF:
1020 writemask |=
1021 get_block_tessfactor_writemask(info, parse, TGSI_OPCODE_ENDIF);
1022 continue;
1023
1024 case TGSI_OPCODE_BGNLOOP:
1025 writemask |=
1026 get_block_tessfactor_writemask(info, parse, TGSI_OPCODE_ENDLOOP);
1027 continue;
1028
1029 case TGSI_OPCODE_BARRIER:
1030 unreachable("nested BARRIER is illegal");
1031 continue;
1032 }
1033
1034 writemask |= get_inst_tessfactor_writemask(info, inst);
1035 } while (inst->Instruction.Opcode != end_opcode);
1036
1037 return writemask;
1038 }
1039
1040 static void
get_if_block_tessfactor_writemask(const struct tgsi_shader_info * info,struct tgsi_parse_context * parse,unsigned * upper_block_tf_writemask,unsigned * cond_block_tf_writemask)1041 get_if_block_tessfactor_writemask(const struct tgsi_shader_info *info,
1042 struct tgsi_parse_context *parse,
1043 unsigned *upper_block_tf_writemask,
1044 unsigned *cond_block_tf_writemask)
1045 {
1046 struct tgsi_full_instruction *inst;
1047 unsigned then_tessfactor_writemask = 0;
1048 unsigned else_tessfactor_writemask = 0;
1049 bool is_then = true;
1050
1051 do {
1052 tgsi_parse_token(parse);
1053 assert(parse->FullToken.Token.Type == TGSI_TOKEN_TYPE_INSTRUCTION);
1054 inst = &parse->FullToken.FullInstruction;
1055 check_no_subroutines(inst);
1056
1057 switch (inst->Instruction.Opcode) {
1058 case TGSI_OPCODE_ELSE:
1059 is_then = false;
1060 continue;
1061
1062 /* Recursively process nested blocks. */
1063 case TGSI_OPCODE_IF:
1064 case TGSI_OPCODE_UIF:
1065 get_if_block_tessfactor_writemask(info, parse,
1066 is_then ? &then_tessfactor_writemask :
1067 &else_tessfactor_writemask,
1068 cond_block_tf_writemask);
1069 continue;
1070
1071 case TGSI_OPCODE_BGNLOOP:
1072 *cond_block_tf_writemask |=
1073 get_block_tessfactor_writemask(info, parse, TGSI_OPCODE_ENDLOOP);
1074 continue;
1075
1076 case TGSI_OPCODE_BARRIER:
1077 unreachable("nested BARRIER is illegal");
1078 continue;
1079 }
1080
1081 /* Process an instruction in the current block. */
1082 unsigned writemask = get_inst_tessfactor_writemask(info, inst);
1083
1084 if (writemask) {
1085 if (is_then)
1086 then_tessfactor_writemask |= writemask;
1087 else
1088 else_tessfactor_writemask |= writemask;
1089 }
1090 } while (inst->Instruction.Opcode != TGSI_OPCODE_ENDIF);
1091
1092 if (then_tessfactor_writemask || else_tessfactor_writemask) {
1093 /* If both statements write the same tess factor channels,
1094 * we can say that the upper block writes them too. */
1095 *upper_block_tf_writemask |= then_tessfactor_writemask &
1096 else_tessfactor_writemask;
1097 *cond_block_tf_writemask |= then_tessfactor_writemask |
1098 else_tessfactor_writemask;
1099 }
1100 }
1101
1102 void
tgsi_scan_tess_ctrl(const struct tgsi_token * tokens,const struct tgsi_shader_info * info,struct tgsi_tessctrl_info * out)1103 tgsi_scan_tess_ctrl(const struct tgsi_token *tokens,
1104 const struct tgsi_shader_info *info,
1105 struct tgsi_tessctrl_info *out)
1106 {
1107 memset(out, 0, sizeof(*out));
1108
1109 if (info->processor != PIPE_SHADER_TESS_CTRL)
1110 return;
1111
1112 struct tgsi_parse_context parse;
1113 if (tgsi_parse_init(&parse, tokens) != TGSI_PARSE_OK) {
1114 debug_printf("tgsi_parse_init() failed in tgsi_scan_arrays()!\n");
1115 return;
1116 }
1117
1118 /* The pass works as follows:
1119 * If all codepaths write tess factors, we can say that all invocations
1120 * define tess factors.
1121 *
1122 * Each tess factor channel is tracked separately.
1123 */
1124 unsigned main_block_tf_writemask = 0; /* if main block writes tess factors */
1125 unsigned cond_block_tf_writemask = 0; /* if cond block writes tess factors */
1126
1127 /* Initial value = true. Here the pass will accumulate results from multiple
1128 * segments surrounded by barriers. If tess factors aren't written at all,
1129 * it's a shader bug and we don't care if this will be true.
1130 */
1131 out->tessfactors_are_def_in_all_invocs = true;
1132
1133 while (!tgsi_parse_end_of_tokens(&parse)) {
1134 tgsi_parse_token(&parse);
1135
1136 if (parse.FullToken.Token.Type != TGSI_TOKEN_TYPE_INSTRUCTION)
1137 continue;
1138
1139 struct tgsi_full_instruction *inst = &parse.FullToken.FullInstruction;
1140 check_no_subroutines(inst);
1141
1142 /* Process nested blocks. */
1143 switch (inst->Instruction.Opcode) {
1144 case TGSI_OPCODE_IF:
1145 case TGSI_OPCODE_UIF:
1146 get_if_block_tessfactor_writemask(info, &parse,
1147 &main_block_tf_writemask,
1148 &cond_block_tf_writemask);
1149 continue;
1150
1151 case TGSI_OPCODE_BGNLOOP:
1152 cond_block_tf_writemask |=
1153 get_block_tessfactor_writemask(info, &parse, TGSI_OPCODE_ENDIF);
1154 continue;
1155
1156 case TGSI_OPCODE_BARRIER:
1157 /* The following case must be prevented:
1158 * gl_TessLevelInner = ...;
1159 * barrier();
1160 * if (gl_InvocationID == 1)
1161 * gl_TessLevelInner = ...;
1162 *
1163 * If you consider disjoint code segments separated by barriers, each
1164 * such segment that writes tess factor channels should write the same
1165 * channels in all codepaths within that segment.
1166 */
1167 if (main_block_tf_writemask || cond_block_tf_writemask) {
1168 /* Accumulate the result: */
1169 out->tessfactors_are_def_in_all_invocs &=
1170 !(cond_block_tf_writemask & ~main_block_tf_writemask);
1171
1172 /* Analyze the next code segment from scratch. */
1173 main_block_tf_writemask = 0;
1174 cond_block_tf_writemask = 0;
1175 }
1176 continue;
1177 }
1178
1179 main_block_tf_writemask |= get_inst_tessfactor_writemask(info, inst);
1180 }
1181
1182 /* Accumulate the result for the last code segment separated by a barrier. */
1183 if (main_block_tf_writemask || cond_block_tf_writemask) {
1184 out->tessfactors_are_def_in_all_invocs &=
1185 !(cond_block_tf_writemask & ~main_block_tf_writemask);
1186 }
1187
1188 tgsi_parse_free(&parse);
1189 }
1190