Lines Matching refs:GCN

1 …-verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=GCN -check-prefix=GCN-NOAA %s
2 …-verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=GCN -check-prefix=GCN-NOAA %s
4 …combiner-alias-analysis < %s | FileCheck -check-prefix=SI -check-prefix=GCN -check-prefix=GCN-AA %s
5 …combiner-alias-analysis < %s | FileCheck -check-prefix=SI -check-prefix=GCN -check-prefix=GCN-AA %s
14 ; GCN-LABEL: {{^}}merge_global_store_2_constants_i8:
15 ; GCN: buffer_store_byte
16 ; GCN: buffer_store_byte
17 ; GCN: s_endpgm
26 ; GCN-LABEL: {{^}}merge_global_store_2_constants_i8_natural_align:
27 ; GCN: buffer_store_byte
28 ; GCN: buffer_store_byte
29 ; GCN: s_endpgm
38 ; GCN-LABEL: {{^}}merge_global_store_2_constants_i16:
39 ; GCN: buffer_store_dword v
48 ; GCN-LABEL: {{^}}merge_global_store_2_constants_0_i16:
49 ; GCN: buffer_store_dword v
58 ; GCN-LABEL: {{^}}merge_global_store_2_constants_i16_natural_align:
59 ; GCN: buffer_store_short
60 ; GCN: buffer_store_short
61 ; GCN: s_endpgm
70 ; GCN-LABEL: {{^}}merge_global_store_2_constants_i32:
73 ; GCN: buffer_store_dwordx2 v{{\[}}[[LO]]:[[HI]]{{\]}}
82 ; GCN-LABEL: {{^}}merge_global_store_2_constants_i32_f32:
83 ; GCN: buffer_store_dwordx2
92 ; GCN-LABEL: {{^}}merge_global_store_2_constants_f32_i32:
95 ; GCN: buffer_store_dwordx2 v{{\[}}[[VLO]]:[[VHI]]{{\]}}
104 ; GCN-LABEL: {{^}}merge_global_store_4_constants_i32:
105 ; GCN-DAG: v_mov_b32_e32 v[[HI:[0-9]+]], 0x14d{{$}}
106 ; GCN-DAG: v_mov_b32_e32 v{{[0-9]+}}, 0x1c8{{$}}
107 ; GCN-DAG: v_mov_b32_e32 v{{[0-9]+}}, 0x7b{{$}}
108 ; GCN-DAG: v_mov_b32_e32 v[[LO:[0-9]+]], 0x4d2{{$}}
109 ; GCN: buffer_store_dwordx4 v{{\[}}[[LO]]:[[HI]]{{\]}}
122 ; GCN-LABEL: {{^}}merge_global_store_4_constants_f32_order:
123 ; GCN: buffer_store_dwordx4
137 ; GCN-LABEL: {{^}}merge_global_store_4_constants_f32:
138 ; GCN: buffer_store_dwordx4
152 ; GCN-LABEL: {{^}}merge_global_store_4_constants_mixed_i32_f32:
153 ; GCN-NOAA: buffer_store_dword v
154 ; GCN-NOAA: buffer_store_dword v
155 ; GCN-NOAA: buffer_store_dword v
156 ; GCN-NOAA: buffer_store_dword v
158 ; GCN-AA: buffer_store_dwordx2
159 ; GCN-AA: buffer_store_dword v
160 ; GCN-AA: buffer_store_dword v
162 ; GCN: s_endpgm
178 ; GCN-LABEL: {{^}}merge_global_store_3_constants_i32:
182 ; GCN: s_endpgm
193 ; GCN-LABEL: {{^}}merge_global_store_2_constants_i64:
194 ; GCN: buffer_store_dwordx4
203 ; GCN-LABEL: {{^}}merge_global_store_4_constants_i64:
204 ; GCN: buffer_store_dwordx4
205 ; GCN: buffer_store_dwordx4
218 ; GCN-LABEL: {{^}}merge_global_store_2_adjacent_loads_i32:
219 ; GCN: buffer_load_dwordx2 [[LOAD:v\[[0-9]+:[0-9]+\]]]
220 ; GCN: buffer_store_dwordx2 [[LOAD]]
233 ; GCN-LABEL: {{^}}merge_global_store_2_adjacent_loads_i32_nonzero_base:
234 ; GCN: buffer_load_dwordx2 [[LOAD:v\[[0-9]+:[0-9]+\]]], s{{\[[0-9]+:[0-9]+\]}}, 0 offset:8
235 ; GCN: buffer_store_dwordx2 [[LOAD]], s{{\[[0-9]+:[0-9]+\]}}, 0 offset:8
250 ; GCN-LABEL: {{^}}merge_global_store_2_adjacent_loads_shuffle_i32:
251 ; GCN: buffer_load_dword v
252 ; GCN: buffer_load_dword v
253 ; GCN: buffer_store_dword v
254 ; GCN: buffer_store_dword v
267 ; GCN-LABEL: {{^}}merge_global_store_4_adjacent_loads_i32:
268 ; GCN: buffer_load_dwordx4 [[LOAD:v\[[0-9]+:[0-9]+\]]]
269 ; GCN: buffer_store_dwordx4 [[LOAD]]
290 ; GCN-LABEL: {{^}}merge_global_store_3_adjacent_loads_i32:
293 ; GCN: s_waitcnt
296 ; GCN: s_endpgm
313 ; GCN-LABEL: {{^}}merge_global_store_4_adjacent_loads_f32:
314 ; GCN: buffer_load_dwordx4 [[LOAD:v\[[0-9]+:[0-9]+\]]]
315 ; GCN: buffer_store_dwordx4 [[LOAD]]
336 ; GCN-LABEL: {{^}}merge_global_store_4_adjacent_loads_i32_nonzero_base:
337 ; GCN: buffer_load_dwordx4 [[LOAD:v\[[0-9]+:[0-9]+\]]], s{{\[[0-9]+:[0-9]+\]}}, 0 offset:44
338 ; GCN: buffer_store_dwordx4 [[LOAD]], s{{\[[0-9]+:[0-9]+\]}}, 0 offset:28
361 ; GCN-LABEL: {{^}}merge_global_store_4_adjacent_loads_inverse_i32:
362 ; GCN: buffer_load_dwordx4 [[LOAD:v\[[0-9]+:[0-9]+\]]]
363 ; GCN: s_barrier
364 ; GCN: buffer_store_dwordx4 [[LOAD]]
392 ; GCN-LABEL: {{^}}merge_global_store_4_adjacent_loads_shuffle_i32:
393 ; GCN: buffer_load_dword v
394 ; GCN: buffer_load_dword v
395 ; GCN: buffer_load_dword v
396 ; GCN: buffer_load_dword v
397 ; GCN: s_barrier
398 ; GCN: buffer_store_dword v
399 ; GCN: buffer_store_dword v
400 ; GCN: buffer_store_dword v
401 ; GCN: buffer_store_dword v
426 ; GCN-LABEL: {{^}}merge_global_store_4_adjacent_loads_i8:
427 ; GCN: buffer_load_dword [[LOAD:v[0-9]+]]
428 ; GCN: buffer_store_dword [[LOAD]]
429 ; GCN: s_endpgm
450 ; GCN-LABEL: {{^}}merge_global_store_4_adjacent_loads_i8_natural_align:
451 ; GCN: buffer_load_ubyte
452 ; GCN: buffer_load_ubyte
453 ; GCN: buffer_load_ubyte
454 ; GCN: buffer_load_ubyte
455 ; GCN: buffer_store_byte
456 ; GCN: buffer_store_byte
457 ; GCN: buffer_store_byte
458 ; GCN: buffer_store_byte
459 ; GCN: s_endpgm
481 ; GCN-LABEL: {{^}}merge_global_store_4_vector_elts_loads_v4i32:
482 ; GCN: buffer_load_dwordx4 [[LOAD:v\[[0-9]+:[0-9]+\]]]
484 ; GCN-NOAA: buffer_store_dword v
485 ; GCN-NOAA: buffer_store_dword v
486 ; GCN-NOAA: buffer_store_dword v
487 ; GCN-NOAA: buffer_store_dword v
489 ; GCN-AA: buffer_store_dwordx4 [[LOAD]]
491 ; GCN: s_endpgm
510 ; GCN-LABEL: {{^}}merge_local_store_2_constants_i8:
511 ; GCN: ds_write_b8
512 ; GCN: ds_write_b8
513 ; GCN: s_endpgm
522 ; GCN-LABEL: {{^}}merge_local_store_2_constants_i32:
523 ; GCN-DAG: v_mov_b32_e32 v[[LO:[0-9]+]], 0x1c8
524 ; GCN-DAG: v_mov_b32_e32 v[[HI:[0-9]+]], 0x7b
525 ; GCN: ds_write2_b32 v{{[0-9]+}}, v[[LO]], v[[HI]] offset1:1{{$}}
534 ; GCN-LABEL: {{^}}merge_local_store_4_constants_i32:
535 ; GCN-DAG: v_mov_b32_e32 [[K2:v[0-9]+]], 0x1c8
536 ; GCN-DAG: v_mov_b32_e32 [[K3:v[0-9]+]], 0x14d
537 ; GCN-DAG: ds_write2_b32 v{{[0-9]+}}, [[K2]], [[K3]] offset0:2 offset1:3
539 ; GCN-DAG: v_mov_b32_e32 [[K0:v[0-9]+]], 0x4d2
540 ; GCN-DAG: v_mov_b32_e32 [[K1:v[0-9]+]], 0x7b
541 ; GCN-DAG: ds_write2_b32 v{{[0-9]+}}, [[K0]], [[K1]] offset1:1
543 ; GCN: s_endpgm
556 ; GCN-LABEL: {{^}}merge_global_store_5_constants_i32:
557 ; GCN-DAG: v_mov_b32_e32 v[[LO:[0-9]+]], 9{{$}}
558 ; GCN-DAG: v_mov_b32_e32 v[[HI4:[0-9]+]], -12{{$}}
559 ; GCN: buffer_store_dwordx4 v{{\[}}[[LO]]:[[HI4]]{{\]}}
560 ; GCN: v_mov_b32_e32 v[[HI:[0-9]+]], 11{{$}}
561 ; GCN: buffer_store_dword v[[HI]]
575 ; GCN-LABEL: {{^}}merge_global_store_6_constants_i32:
576 ; GCN: buffer_store_dwordx4
577 ; GCN: buffer_store_dwordx2
593 ; GCN-LABEL: {{^}}merge_global_store_7_constants_i32:
594 ; GCN: buffer_store_dwordx4
595 ; GCN: buffer_store_dwordx2
596 ; GCN: buffer_store_dword v
614 ; GCN-LABEL: {{^}}merge_global_store_8_constants_i32:
615 ; GCN: buffer_store_dwordx4
616 ; GCN: buffer_store_dwordx4
617 ; GCN: s_endpgm
641 ; GCN-LABEL: {{^}}copy_v3i32_align4:
642 ; GCN-NOT: SCRATCH_RSRC_DWORD
643 ; GCN-DAG: buffer_load_dword v{{[0-9]+}}, s{{\[[0-9]+:[0-9]+\]}}, 0 offset:8
644 ; GCN-DAG: buffer_load_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0{{$}}
645 ; GCN-NOT: offen
646 ; GCN: s_waitcnt vmcnt
647 ; GCN-NOT: offen
648 ; GCN-DAG: buffer_store_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0{{$}}
649 ; GCN-DAG: buffer_store_dword v{{[0-9]+}}, s{{\[[0-9]+:[0-9]+\]}}, 0 offset:8
651 ; GCN: ScratchSize: 0{{$}}
658 ; GCN-LABEL: {{^}}copy_v3i64_align4:
659 ; GCN-NOT: SCRATCH_RSRC_DWORD
660 ; GCN-DAG: buffer_load_dwordx4 v{{\[[0-9]+:[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0{{$}}
661 ; GCN-DAG: buffer_load_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0 offset:16{{$}}
662 ; GCN-NOT: offen
663 ; GCN: s_waitcnt vmcnt
664 ; GCN-NOT: offen
665 ; GCN-DAG: buffer_store_dwordx4 v{{\[[0-9]+:[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0{{$}}
666 ; GCN-DAG: buffer_store_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0 offset:16{{$}}
667 ; GCN: ScratchSize: 0{{$}}
674 ; GCN-LABEL: {{^}}copy_v3f32_align4:
675 ; GCN-NOT: SCRATCH_RSRC_DWORD
676 ; GCN-DAG: buffer_load_dword v{{[0-9]+}}, s{{\[[0-9]+:[0-9]+\]}}, 0 offset:8
677 ; GCN-DAG: buffer_load_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0{{$}}
678 ; GCN-NOT: offen
679 ; GCN: s_waitcnt vmcnt
680 ; GCN-NOT: offen
681 ; GCN-DAG: buffer_store_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0{{$}}
682 ; GCN-DAG: buffer_store_dword v{{[0-9]+}}, s{{\[[0-9]+:[0-9]+\]}}, 0 offset:8
683 ; GCN: ScratchSize: 0{{$}}
691 ; GCN-LABEL: {{^}}copy_v3f64_align4:
692 ; GCN-NOT: SCRATCH_RSRC_DWORD
693 ; GCN-DAG: buffer_load_dwordx4 v{{\[[0-9]+:[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0{{$}}
694 ; GCN-DAG: buffer_load_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0 offset:16{{$}}
695 ; GCN-NOT: offen
696 ; GCN: s_waitcnt vmcnt
697 ; GCN-NOT: offen
698 ; GCN-DAG: buffer_store_dwordx4 v{{\[[0-9]+:[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0{{$}}
699 ; GCN-DAG: buffer_store_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0 offset:16{{$}}
700 ; GCN: ScratchSize: 0{{$}}