Lines Matching refs:GFX906
3 …ote-alloca,+sram-ecc -verify-machineinstrs < %s | FileCheck -check-prefixes=GCN,GFX906,NO-D16-HI %s
15 ; GFX906-LABEL: load_local_lo_v2i16_undeflo:
16 ; GFX906: ; %bb.0: ; %entry
17 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
18 ; GFX906-NEXT: ds_read_u16 v0, v0
19 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
20 ; GFX906-NEXT: s_setpc_b64 s[30:31]
45 ; GFX906-LABEL: load_local_lo_v2i16_reglo:
46 ; GFX906: ; %bb.0: ; %entry
47 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
48 ; GFX906-NEXT: ds_read_u16 v0, v0
49 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
50 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
51 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
52 ; GFX906-NEXT: s_setpc_b64 s[30:31]
83 ; GFX906-LABEL: load_local_lo_v2i16_reglo_vreg:
84 ; GFX906: ; %bb.0: ; %entry
85 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
86 ; GFX906-NEXT: ds_read_u16 v0, v0
87 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
88 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
89 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
90 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
91 ; GFX906-NEXT: s_waitcnt vmcnt(0)
92 ; GFX906-NEXT: s_setpc_b64 s[30:31]
123 ; GFX906-LABEL: load_local_lo_v2i16_zerolo:
124 ; GFX906: ; %bb.0: ; %entry
125 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
126 ; GFX906-NEXT: ds_read_u16 v0, v0
127 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
128 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
129 ; GFX906-NEXT: s_setpc_b64 s[30:31]
154 ; GFX906-LABEL: load_local_lo_v2f16_fpimm:
155 ; GFX906: ; %bb.0: ; %entry
156 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
157 ; GFX906-NEXT: ds_read_u16 v0, v0
158 ; GFX906-NEXT: s_movk_i32 s4, 0x4000
159 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
160 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
161 ; GFX906-NEXT: v_lshl_or_b32 v0, s4, 16, v0
162 ; GFX906-NEXT: s_setpc_b64 s[30:31]
188 ; GFX906-LABEL: load_local_lo_v2f16_reghi_vreg:
189 ; GFX906: ; %bb.0: ; %entry
190 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
191 ; GFX906-NEXT: ds_read_u16 v0, v0
192 ; GFX906-NEXT: v_lshrrev_b32_e32 v1, 16, v1
193 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
194 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
195 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
196 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
197 ; GFX906-NEXT: s_waitcnt vmcnt(0)
198 ; GFX906-NEXT: s_setpc_b64 s[30:31]
231 ; GFX906-LABEL: load_local_lo_v2f16_reglo_vreg:
232 ; GFX906: ; %bb.0: ; %entry
233 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
234 ; GFX906-NEXT: ds_read_u16 v0, v0
235 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
236 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
237 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
238 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
239 ; GFX906-NEXT: s_waitcnt vmcnt(0)
240 ; GFX906-NEXT: s_setpc_b64 s[30:31]
271 ; GFX906-LABEL: load_local_lo_v2i16_reghi_vreg_zexti8:
272 ; GFX906: ; %bb.0: ; %entry
273 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
274 ; GFX906-NEXT: ds_read_u8 v0, v0
275 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
276 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
277 ; GFX906-NEXT: v_bfi_b32 v0, v2, v0, v1
278 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
279 ; GFX906-NEXT: s_waitcnt vmcnt(0)
280 ; GFX906-NEXT: s_setpc_b64 s[30:31]
315 ; GFX906-LABEL: load_local_lo_v2i16_reglo_vreg_zexti8:
316 ; GFX906: ; %bb.0: ; %entry
317 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
318 ; GFX906-NEXT: ds_read_u8 v0, v0
319 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
320 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
321 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
322 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
323 ; GFX906-NEXT: s_waitcnt vmcnt(0)
324 ; GFX906-NEXT: s_setpc_b64 s[30:31]
356 ; GFX906-LABEL: load_local_lo_v2i16_reghi_vreg_sexti8:
357 ; GFX906: ; %bb.0: ; %entry
358 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
359 ; GFX906-NEXT: ds_read_i8 v0, v0
360 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
361 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
362 ; GFX906-NEXT: v_bfi_b32 v0, v2, v0, v1
363 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
364 ; GFX906-NEXT: s_waitcnt vmcnt(0)
365 ; GFX906-NEXT: s_setpc_b64 s[30:31]
399 ; GFX906-LABEL: load_local_lo_v2i16_reglo_vreg_sexti8:
400 ; GFX906: ; %bb.0: ; %entry
401 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
402 ; GFX906-NEXT: ds_read_i8 v0, v0
403 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
404 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
405 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
406 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
407 ; GFX906-NEXT: s_waitcnt vmcnt(0)
408 ; GFX906-NEXT: s_setpc_b64 s[30:31]
442 ; GFX906-LABEL: load_local_lo_v2f16_reglo_vreg_zexti8:
443 ; GFX906: ; %bb.0: ; %entry
444 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
445 ; GFX906-NEXT: ds_read_u8 v0, v0
446 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
447 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
448 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
449 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
450 ; GFX906-NEXT: s_waitcnt vmcnt(0)
451 ; GFX906-NEXT: s_setpc_b64 s[30:31]
486 ; GFX906-LABEL: load_local_lo_v2f16_reglo_vreg_sexti8:
487 ; GFX906: ; %bb.0: ; %entry
488 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
489 ; GFX906-NEXT: ds_read_i8 v0, v0
490 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
491 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
492 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
493 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
494 ; GFX906-NEXT: s_waitcnt vmcnt(0)
495 ; GFX906-NEXT: s_setpc_b64 s[30:31]
532 ; GFX906-LABEL: load_local_lo_v2i16_reghi_vreg_multi_use_lo:
533 ; GFX906: ; %bb.0: ; %entry
534 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
535 ; GFX906-NEXT: ds_read_u16 v0, v0
536 ; GFX906-NEXT: v_mov_b32_e32 v2, 0
537 ; GFX906-NEXT: v_mov_b32_e32 v3, 0xffff
538 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
539 ; GFX906-NEXT: ds_write_b16 v2, v0
540 ; GFX906-NEXT: v_bfi_b32 v0, v3, v0, v1
541 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
542 ; GFX906-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
543 ; GFX906-NEXT: s_setpc_b64 s[30:31]
580 ; GFX906-LABEL: load_local_lo_v2i16_reghi_vreg_multi_use_hi:
581 ; GFX906: ; %bb.0: ; %entry
582 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
583 ; GFX906-NEXT: ds_read_u16 v0, v0
584 ; GFX906-NEXT: v_lshrrev_b32_e32 v2, 16, v1
585 ; GFX906-NEXT: v_mov_b32_e32 v3, 0
586 ; GFX906-NEXT: ds_write_b16 v3, v2
587 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
588 ; GFX906-NEXT: s_waitcnt lgkmcnt(1)
589 ; GFX906-NEXT: v_bfi_b32 v0, v2, v0, v1
590 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
591 ; GFX906-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
592 ; GFX906-NEXT: s_setpc_b64 s[30:31]
632 ; GFX906-LABEL: load_local_lo_v2i16_reghi_vreg_multi_use_lohi:
633 ; GFX906: ; %bb.0: ; %entry
634 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
635 ; GFX906-NEXT: ds_read_u16 v0, v0
636 ; GFX906-NEXT: v_lshrrev_b32_e32 v4, 16, v1
637 ; GFX906-NEXT: s_waitcnt lgkmcnt(0)
638 ; GFX906-NEXT: ds_write_b16 v2, v0
639 ; GFX906-NEXT: ds_write_b16 v3, v4
640 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
641 ; GFX906-NEXT: v_bfi_b32 v0, v2, v0, v1
642 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
643 ; GFX906-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
644 ; GFX906-NEXT: s_setpc_b64 s[30:31]
680 ; GFX906-LABEL: load_global_lo_v2i16_reglo_vreg:
681 ; GFX906: ; %bb.0: ; %entry
682 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
683 ; GFX906-NEXT: global_load_ushort v0, v[0:1], off offset:-4094
684 ; GFX906-NEXT: v_mov_b32_e32 v1, 0xffff
685 ; GFX906-NEXT: s_waitcnt vmcnt(0)
686 ; GFX906-NEXT: v_bfi_b32 v0, v1, v0, v2
687 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
688 ; GFX906-NEXT: s_waitcnt vmcnt(0)
689 ; GFX906-NEXT: s_setpc_b64 s[30:31]
722 ; GFX906-LABEL: load_global_lo_v2f16_reglo_vreg:
723 ; GFX906: ; %bb.0: ; %entry
724 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
725 ; GFX906-NEXT: global_load_ushort v0, v[0:1], off offset:-4094
726 ; GFX906-NEXT: v_lshrrev_b32_e32 v1, 16, v2
727 ; GFX906-NEXT: s_waitcnt vmcnt(0)
728 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
729 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
730 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
731 ; GFX906-NEXT: s_waitcnt vmcnt(0)
732 ; GFX906-NEXT: s_setpc_b64 s[30:31]
765 ; GFX906-LABEL: load_global_lo_v2i16_reglo_vreg_zexti8:
766 ; GFX906: ; %bb.0: ; %entry
767 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
768 ; GFX906-NEXT: global_load_ubyte v0, v[0:1], off offset:-4095
769 ; GFX906-NEXT: v_mov_b32_e32 v1, 0xffff
770 ; GFX906-NEXT: s_waitcnt vmcnt(0)
771 ; GFX906-NEXT: v_bfi_b32 v0, v1, v0, v2
772 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
773 ; GFX906-NEXT: s_waitcnt vmcnt(0)
774 ; GFX906-NEXT: s_setpc_b64 s[30:31]
809 ; GFX906-LABEL: load_global_lo_v2i16_reglo_vreg_sexti8:
810 ; GFX906: ; %bb.0: ; %entry
811 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
812 ; GFX906-NEXT: global_load_sbyte v0, v[0:1], off offset:-4095
813 ; GFX906-NEXT: v_mov_b32_e32 v1, 0xffff
814 ; GFX906-NEXT: s_waitcnt vmcnt(0)
815 ; GFX906-NEXT: v_bfi_b32 v0, v1, v0, v2
816 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
817 ; GFX906-NEXT: s_waitcnt vmcnt(0)
818 ; GFX906-NEXT: s_setpc_b64 s[30:31]
852 ; GFX906-LABEL: load_global_lo_v2f16_reglo_vreg_zexti8:
853 ; GFX906: ; %bb.0: ; %entry
854 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
855 ; GFX906-NEXT: global_load_ubyte v0, v[0:1], off offset:-4095
856 ; GFX906-NEXT: v_lshrrev_b32_e32 v1, 16, v2
857 ; GFX906-NEXT: s_waitcnt vmcnt(0)
858 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
859 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
860 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
861 ; GFX906-NEXT: s_waitcnt vmcnt(0)
862 ; GFX906-NEXT: s_setpc_b64 s[30:31]
898 ; GFX906-LABEL: load_global_lo_v2f16_reglo_vreg_sexti8:
899 ; GFX906: ; %bb.0: ; %entry
900 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
901 ; GFX906-NEXT: global_load_sbyte v0, v[0:1], off offset:-4095
902 ; GFX906-NEXT: v_lshrrev_b32_e32 v1, 16, v2
903 ; GFX906-NEXT: s_waitcnt vmcnt(0)
904 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
905 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
906 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
907 ; GFX906-NEXT: s_waitcnt vmcnt(0)
908 ; GFX906-NEXT: s_setpc_b64 s[30:31]
943 ; GFX906-LABEL: load_flat_lo_v2i16_reghi_vreg:
944 ; GFX906: ; %bb.0: ; %entry
945 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
946 ; GFX906-NEXT: flat_load_ushort v0, v[0:1]
947 ; GFX906-NEXT: v_mov_b32_e32 v1, 0xffff
948 ; GFX906-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
949 ; GFX906-NEXT: v_bfi_b32 v0, v1, v0, v2
950 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
951 ; GFX906-NEXT: s_waitcnt vmcnt(0)
952 ; GFX906-NEXT: s_setpc_b64 s[30:31]
982 ; GFX906-LABEL: load_flat_lo_v2f16_reghi_vreg:
983 ; GFX906: ; %bb.0: ; %entry
984 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
985 ; GFX906-NEXT: flat_load_ushort v0, v[0:1]
986 ; GFX906-NEXT: v_lshrrev_b32_e32 v1, 16, v2
987 ; GFX906-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
988 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
989 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
990 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
991 ; GFX906-NEXT: s_waitcnt vmcnt(0)
992 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1024 ; GFX906-LABEL: load_flat_lo_v2i16_reglo_vreg_zexti8:
1025 ; GFX906: ; %bb.0: ; %entry
1026 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1027 ; GFX906-NEXT: flat_load_ubyte v0, v[0:1]
1028 ; GFX906-NEXT: v_mov_b32_e32 v1, 0xffff
1029 ; GFX906-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
1030 ; GFX906-NEXT: v_bfi_b32 v0, v1, v0, v2
1031 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1032 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1033 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1065 ; GFX906-LABEL: load_flat_lo_v2i16_reglo_vreg_sexti8:
1066 ; GFX906: ; %bb.0: ; %entry
1067 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1068 ; GFX906-NEXT: flat_load_sbyte v0, v[0:1]
1069 ; GFX906-NEXT: v_mov_b32_e32 v1, 0xffff
1070 ; GFX906-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
1071 ; GFX906-NEXT: v_bfi_b32 v0, v1, v0, v2
1072 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1073 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1074 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1105 ; GFX906-LABEL: load_flat_lo_v2f16_reglo_vreg_zexti8:
1106 ; GFX906: ; %bb.0: ; %entry
1107 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1108 ; GFX906-NEXT: flat_load_ubyte v0, v[0:1]
1109 ; GFX906-NEXT: v_lshrrev_b32_e32 v1, 16, v2
1110 ; GFX906-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
1111 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
1112 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
1113 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1114 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1115 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1148 ; GFX906-LABEL: load_flat_lo_v2f16_reglo_vreg_sexti8:
1149 ; GFX906: ; %bb.0: ; %entry
1150 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1151 ; GFX906-NEXT: flat_load_sbyte v0, v[0:1]
1152 ; GFX906-NEXT: v_lshrrev_b32_e32 v1, 16, v2
1153 ; GFX906-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
1154 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
1155 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
1156 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1157 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1158 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1190 ; GFX906-LABEL: load_private_lo_v2i16_reglo_vreg:
1191 ; GFX906: ; %bb.0: ; %entry
1192 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1193 ; GFX906-NEXT: buffer_load_ushort v1, off, s[0:3], s32 offset:4094
1194 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
1195 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1196 ; GFX906-NEXT: v_bfi_b32 v0, v2, v1, v0
1197 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1198 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1199 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1241 ; GFX906-LABEL: load_private_lo_v2i16_reghi_vreg:
1242 ; GFX906: ; %bb.0: ; %entry
1243 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1244 ; GFX906-NEXT: buffer_load_ushort v1, off, s[0:3], s32 offset:4094
1245 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1246 ; GFX906-NEXT: v_and_b32_e32 v1, 0xffff, v1
1247 ; GFX906-NEXT: v_lshl_or_b32 v0, v0, 16, v1
1248 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1249 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1250 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1292 ; GFX906-LABEL: load_private_lo_v2f16_reglo_vreg:
1293 ; GFX906: ; %bb.0: ; %entry
1294 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1295 ; GFX906-NEXT: buffer_load_ushort v1, off, s[0:3], s32 offset:4094
1296 ; GFX906-NEXT: v_lshrrev_b32_e32 v0, 16, v0
1297 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1298 ; GFX906-NEXT: v_and_b32_e32 v1, 0xffff, v1
1299 ; GFX906-NEXT: v_lshl_or_b32 v0, v0, 16, v1
1300 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1301 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1302 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1342 ; GFX906-LABEL: load_private_lo_v2i16_reglo_vreg_nooff:
1343 ; GFX906: ; %bb.0: ; %entry
1344 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1345 ; GFX906-NEXT: buffer_load_ushort v0, off, s[0:3], 0 offset:4094
1346 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
1347 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1348 ; GFX906-NEXT: v_bfi_b32 v0, v2, v0, v1
1349 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1350 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1351 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1391 ; GFX906-LABEL: load_private_lo_v2i16_reghi_vreg_nooff:
1392 ; GFX906: ; %bb.0: ; %entry
1393 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1394 ; GFX906-NEXT: buffer_load_ushort v0, off, s[0:3], 0 offset:4094
1395 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
1396 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1397 ; GFX906-NEXT: v_bfi_b32 v0, v2, v0, v1
1398 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1399 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1400 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1440 ; GFX906-LABEL: load_private_lo_v2f16_reglo_vreg_nooff:
1441 ; GFX906: ; %bb.0: ; %entry
1442 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1443 ; GFX906-NEXT: buffer_load_ushort v0, off, s[0:3], 0 offset:4094
1444 ; GFX906-NEXT: v_lshrrev_b32_e32 v1, 16, v1
1445 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1446 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
1447 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
1448 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1449 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1450 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1490 ; GFX906-LABEL: load_private_lo_v2i16_reglo_vreg_zexti8:
1491 ; GFX906: ; %bb.0: ; %entry
1492 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1493 ; GFX906-NEXT: buffer_load_ubyte v1, off, s[0:3], s32 offset:4095
1494 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
1495 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1496 ; GFX906-NEXT: v_bfi_b32 v0, v2, v1, v0
1497 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1498 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1499 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1541 ; GFX906-LABEL: load_private_lo_v2i16_reglo_vreg_sexti8:
1542 ; GFX906: ; %bb.0: ; %entry
1543 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1544 ; GFX906-NEXT: buffer_load_sbyte v1, off, s[0:3], s32 offset:4095
1545 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
1546 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1547 ; GFX906-NEXT: v_bfi_b32 v0, v2, v1, v0
1548 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1549 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1550 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1591 ; GFX906-LABEL: load_private_lo_v2i16_reglo_vreg_nooff_zexti8:
1592 ; GFX906: ; %bb.0: ; %entry
1593 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1594 ; GFX906-NEXT: buffer_load_ubyte v0, off, s[0:3], 0 offset:4094
1595 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
1596 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1597 ; GFX906-NEXT: v_bfi_b32 v0, v2, v0, v1
1598 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1599 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1600 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1642 ; GFX906-LABEL: load_private_lo_v2i16_reglo_vreg_nooff_sexti8:
1643 ; GFX906: ; %bb.0: ; %entry
1644 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1645 ; GFX906-NEXT: buffer_load_sbyte v0, off, s[0:3], 0 offset:4094
1646 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
1647 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1648 ; GFX906-NEXT: v_bfi_b32 v0, v2, v0, v1
1649 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1650 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1651 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1692 ; GFX906-LABEL: load_private_lo_v2f16_reglo_vreg_nooff_zexti8:
1693 ; GFX906: ; %bb.0: ; %entry
1694 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1695 ; GFX906-NEXT: buffer_load_ubyte v0, off, s[0:3], 0 offset:4094
1696 ; GFX906-NEXT: v_lshrrev_b32_e32 v1, 16, v1
1697 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1698 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
1699 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
1700 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1701 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1702 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1745 ; GFX906-LABEL: load_constant_lo_v2i16_reglo_vreg:
1746 ; GFX906: ; %bb.0: ; %entry
1747 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1748 ; GFX906-NEXT: global_load_ushort v0, v[0:1], off offset:-4094
1749 ; GFX906-NEXT: v_mov_b32_e32 v1, 0xffff
1750 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1751 ; GFX906-NEXT: v_bfi_b32 v0, v1, v0, v2
1752 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1753 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1754 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1787 ; GFX906-LABEL: load_constant_lo_v2f16_reglo_vreg:
1788 ; GFX906: ; %bb.0: ; %entry
1789 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1790 ; GFX906-NEXT: global_load_ushort v0, v[0:1], off offset:-4094
1791 ; GFX906-NEXT: v_lshrrev_b32_e32 v1, 16, v2
1792 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1793 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
1794 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
1795 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1796 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1797 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1830 ; GFX906-LABEL: load_constant_lo_v2f16_reglo_vreg_zexti8:
1831 ; GFX906: ; %bb.0: ; %entry
1832 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1833 ; GFX906-NEXT: global_load_ubyte v0, v[0:1], off offset:-4095
1834 ; GFX906-NEXT: v_lshrrev_b32_e32 v1, 16, v2
1835 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1836 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
1837 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
1838 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1839 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1840 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1876 ; GFX906-LABEL: load_constant_lo_v2f16_reglo_vreg_sexti8:
1877 ; GFX906: ; %bb.0: ; %entry
1878 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1879 ; GFX906-NEXT: global_load_sbyte v0, v[0:1], off offset:-4095
1880 ; GFX906-NEXT: v_lshrrev_b32_e32 v1, 16, v2
1881 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1882 ; GFX906-NEXT: v_and_b32_e32 v0, 0xffff, v0
1883 ; GFX906-NEXT: v_lshl_or_b32 v0, v1, 16, v0
1884 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1885 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1886 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1923 ; GFX906-LABEL: load_private_lo_v2i16_reglo_vreg_to_offset:
1924 ; GFX906: ; %bb.0: ; %entry
1925 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1926 ; GFX906-NEXT: v_mov_b32_e32 v1, 0x7b
1927 ; GFX906-NEXT: buffer_store_dword v1, off, s[0:3], s32
1928 ; GFX906-NEXT: buffer_load_ushort v1, off, s[0:3], s32 offset:4094
1929 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
1930 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1931 ; GFX906-NEXT: v_bfi_b32 v0, v2, v1, v0
1932 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1933 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1934 ; GFX906-NEXT: s_setpc_b64 s[30:31]
1984 ; GFX906-LABEL: load_private_lo_v2i16_reglo_vreg_sexti8_to_offset:
1985 ; GFX906: ; %bb.0: ; %entry
1986 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
1987 ; GFX906-NEXT: v_mov_b32_e32 v1, 0x7b
1988 ; GFX906-NEXT: buffer_store_dword v1, off, s[0:3], s32
1989 ; GFX906-NEXT: buffer_load_sbyte v1, off, s[0:3], s32 offset:4095
1990 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
1991 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1992 ; GFX906-NEXT: v_bfi_b32 v0, v2, v1, v0
1993 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
1994 ; GFX906-NEXT: s_waitcnt vmcnt(0)
1995 ; GFX906-NEXT: s_setpc_b64 s[30:31]
2046 ; GFX906-LABEL: load_private_lo_v2i16_reglo_vreg_zexti8_to_offset:
2047 ; GFX906: ; %bb.0: ; %entry
2048 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
2049 ; GFX906-NEXT: v_mov_b32_e32 v1, 0x7b
2050 ; GFX906-NEXT: buffer_store_dword v1, off, s[0:3], s32
2051 ; GFX906-NEXT: buffer_load_ubyte v1, off, s[0:3], s32 offset:4095
2052 ; GFX906-NEXT: v_mov_b32_e32 v2, 0xffff
2053 ; GFX906-NEXT: s_waitcnt vmcnt(0)
2054 ; GFX906-NEXT: v_bfi_b32 v0, v2, v1, v0
2055 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
2056 ; GFX906-NEXT: s_waitcnt vmcnt(0)
2057 ; GFX906-NEXT: s_setpc_b64 s[30:31]
2109 ; GFX906-LABEL: load_private_lo_v2f16_reglo_vreg_sexti8_to_offset:
2110 ; GFX906: ; %bb.0: ; %entry
2111 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
2112 ; GFX906-NEXT: v_mov_b32_e32 v1, 0x7b
2113 ; GFX906-NEXT: buffer_store_dword v1, off, s[0:3], s32
2114 ; GFX906-NEXT: buffer_load_sbyte v1, off, s[0:3], s32 offset:4095
2115 ; GFX906-NEXT: v_lshrrev_b32_e32 v0, 16, v0
2116 ; GFX906-NEXT: s_waitcnt vmcnt(0)
2117 ; GFX906-NEXT: v_and_b32_e32 v1, 0xffff, v1
2118 ; GFX906-NEXT: v_lshl_or_b32 v0, v0, 16, v1
2119 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
2120 ; GFX906-NEXT: s_waitcnt vmcnt(0)
2121 ; GFX906-NEXT: s_setpc_b64 s[30:31]
2173 ; GFX906-LABEL: load_private_lo_v2f16_reglo_vreg_zexti8_to_offset:
2174 ; GFX906: ; %bb.0: ; %entry
2175 ; GFX906-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
2176 ; GFX906-NEXT: v_mov_b32_e32 v1, 0x7b
2177 ; GFX906-NEXT: buffer_store_dword v1, off, s[0:3], s32
2178 ; GFX906-NEXT: buffer_load_ubyte v1, off, s[0:3], s32 offset:4095
2179 ; GFX906-NEXT: v_lshrrev_b32_e32 v0, 16, v0
2180 ; GFX906-NEXT: s_waitcnt vmcnt(0)
2181 ; GFX906-NEXT: v_and_b32_e32 v1, 0xffff, v1
2182 ; GFX906-NEXT: v_lshl_or_b32 v0, v0, 16, v1
2183 ; GFX906-NEXT: global_store_dword v[0:1], v0, off
2184 ; GFX906-NEXT: s_waitcnt vmcnt(0)
2185 ; GFX906-NEXT: s_setpc_b64 s[30:31]