/external/llvm-project/llvm/test/CodeGen/AMDGPU/GlobalISel/ |
D | lshr.ll | 62 ; GFX6-NEXT: s_lshr_b32 s0, s0, s1 70 ; GFX8-NEXT: s_lshr_b32 s0, s0, s1 78 ; GFX9-NEXT: s_lshr_b32 s0, s0, s1 88 ; GCN-NEXT: s_lshr_b32 s0, s0, 7 125 ; GCN-NEXT: s_lshr_b32 s0, s0, s1 135 ; GCN-NEXT: s_lshr_b32 s0, s0, 7 164 ; GCN-NEXT: s_lshr_b32 s0, s0, s1 173 ; GCN-NEXT: s_lshr_b32 s0, s0, 31 234 ; GCN-NEXT: s_lshr_b32 s0, s0, s2 235 ; GCN-NEXT: s_lshr_b32 s1, s1, s3 [all …]
|
D | store-local.128.ll | 47 ; GFX9-NEXT: s_lshr_b32 s5, s0, 8 50 ; GFX9-NEXT: s_lshr_b32 s6, s0, 16 51 ; GFX9-NEXT: s_lshr_b32 s7, s0, 24 58 ; GFX9-NEXT: s_lshr_b32 s0, s1, 8 61 ; GFX9-NEXT: s_lshr_b32 s4, s1, 16 62 ; GFX9-NEXT: s_lshr_b32 s5, s1, 24 69 ; GFX9-NEXT: s_lshr_b32 s0, s2, 8 72 ; GFX9-NEXT: s_lshr_b32 s1, s2, 16 73 ; GFX9-NEXT: s_lshr_b32 s4, s2, 24 80 ; GFX9-NEXT: s_lshr_b32 s0, s3, 8 [all …]
|
D | store-local.96.ll | 45 ; GFX9-NEXT: s_lshr_b32 s3, s0, 8 48 ; GFX9-NEXT: s_lshr_b32 s5, s0, 16 49 ; GFX9-NEXT: s_lshr_b32 s6, s0, 24 56 ; GFX9-NEXT: s_lshr_b32 s0, s1, 8 59 ; GFX9-NEXT: s_lshr_b32 s3, s1, 16 60 ; GFX9-NEXT: s_lshr_b32 s4, s1, 24 67 ; GFX9-NEXT: s_lshr_b32 s0, s2, 8 70 ; GFX9-NEXT: s_lshr_b32 s1, s2, 16 73 ; GFX9-NEXT: s_lshr_b32 s3, s2, 24 87 ; GFX7-NEXT: s_lshr_b32 s3, s0, 8 [all …]
|
D | add.v2i16.ll | 154 ; GFX9-NEXT: s_lshr_b32 s1, s0, 16 163 ; GFX8-NEXT: s_lshr_b32 s2, s0, 16 180 ; GFX9-NEXT: s_lshr_b32 s1, s0, 16 189 ; GFX8-NEXT: s_lshr_b32 s1, s0, 16 205 ; GFX9-NEXT: s_lshr_b32 s1, s0, 16 214 ; GFX8-NEXT: s_lshr_b32 s1, s0, 16 230 ; GFX9-NEXT: s_lshr_b32 s2, s0, 16 231 ; GFX9-NEXT: s_lshr_b32 s3, s1, 16 240 ; GFX8-NEXT: s_lshr_b32 s2, s0, 16 241 ; GFX8-NEXT: s_lshr_b32 s4, s1, 16 [all …]
|
D | insertelement.i8.ll | 708 ; GFX9-NEXT: s_lshr_b32 s2, s1, 8 710 ; GFX9-NEXT: s_lshr_b32 s3, s1, 16 711 ; GFX9-NEXT: s_lshr_b32 s5, s1, 24 744 ; GFX8-NEXT: s_lshr_b32 s1, s0, 8 746 ; GFX8-NEXT: s_lshr_b32 s2, s0, 16 747 ; GFX8-NEXT: s_lshr_b32 s3, s0, 24 783 ; GFX7-NEXT: s_lshr_b32 s1, s0, 8 785 ; GFX7-NEXT: s_lshr_b32 s2, s0, 16 786 ; GFX7-NEXT: s_lshr_b32 s3, s0, 24 833 ; GFX9-NEXT: s_lshr_b32 s2, s1, 8 [all …]
|
D | extractelement.i8.ll | 12 ; GCN-NEXT: s_lshr_b32 s1, s0, 8 14 ; GCN-NEXT: s_lshr_b32 s2, s0, 16 15 ; GCN-NEXT: s_lshr_b32 s3, s0, 24 26 ; GCN-NEXT: s_lshr_b32 s0, s0, s1 183 ; GFX9-NEXT: s_lshr_b32 s1, s0, 8 185 ; GFX9-NEXT: s_lshr_b32 s2, s0, 16 186 ; GFX9-NEXT: s_lshr_b32 s3, s0, 24 206 ; GFX8-NEXT: s_lshr_b32 s1, s0, 8 208 ; GFX8-NEXT: s_lshr_b32 s2, s0, 16 209 ; GFX8-NEXT: s_lshr_b32 s3, s0, 24 [all …]
|
D | combine-shift-of-shifted-logic.ll | 44 ; CHECK-NEXT: s_lshr_b32 s0, s0, 4 56 ; CHECK-NEXT: s_lshr_b32 s0, s0, 8 69 ; CHECK-NEXT: s_lshr_b32 s0, s0, 5 159 ; CHECK-NEXT: s_lshr_b32 s0, s0, 4 183 ; CHECK-NEXT: s_lshr_b32 s0, s0, 5 272 ; CHECK-NEXT: s_lshr_b32 s0, s0, 4 285 ; CHECK-NEXT: s_lshr_b32 s0, s0, 6 297 ; CHECK-NEXT: s_lshr_b32 s0, s0, 5
|
D | ashr.ll | 548 ; GFX8-NEXT: s_lshr_b32 s2, s0, 16 549 ; GFX8-NEXT: s_lshr_b32 s3, s1, 16 563 ; GFX9-NEXT: s_lshr_b32 s2, s0, 16 564 ; GFX9-NEXT: s_lshr_b32 s3, s1, 16 592 ; GFX8-NEXT: s_lshr_b32 s1, s0, 16 626 ; GFX8-NEXT: s_lshr_b32 s1, s0, 16 730 ; GFX8-NEXT: s_lshr_b32 s4, s0, 16 731 ; GFX8-NEXT: s_lshr_b32 s6, s2, 16 732 ; GFX8-NEXT: s_lshr_b32 s5, s1, 16 733 ; GFX8-NEXT: s_lshr_b32 s7, s3, 16 [all …]
|
D | shl.ll | 555 ; GFX8-NEXT: s_lshr_b32 s2, s0, 16 556 ; GFX8-NEXT: s_lshr_b32 s4, s1, 16 568 ; GFX9-NEXT: s_lshr_b32 s2, s0, 16 569 ; GFX9-NEXT: s_lshr_b32 s3, s1, 16 595 ; GFX8-NEXT: s_lshr_b32 s1, s0, 16 627 ; GFX8-NEXT: s_lshr_b32 s1, s0, 16 724 ; GFX8-NEXT: s_lshr_b32 s4, s0, 16 725 ; GFX8-NEXT: s_lshr_b32 s7, s2, 16 730 ; GFX8-NEXT: s_lshr_b32 s5, s1, 16 731 ; GFX8-NEXT: s_lshr_b32 s8, s3, 16 [all …]
|
D | usubsat.ll | 57 ; GFX6-NEXT: s_lshr_b32 s0, s0, 25 145 ; GFX6-NEXT: s_lshr_b32 s0, s0, 24 264 ; GFX6-NEXT: s_lshr_b32 s2, s0, 8 265 ; GFX6-NEXT: s_lshr_b32 s3, s1, 8 272 ; GFX6-NEXT: s_lshr_b32 s0, s0, 24 277 ; GFX6-NEXT: s_lshr_b32 s1, s1, 24 285 ; GFX8-NEXT: s_lshr_b32 s3, s1, 8 287 ; GFX8-NEXT: s_lshr_b32 s2, s0, 8 303 ; GFX9-NEXT: s_lshr_b32 s2, s0, 8 304 ; GFX9-NEXT: s_lshr_b32 s3, s1, 8 [all …]
|
/external/llvm-project/llvm/test/CodeGen/AMDGPU/ |
D | store-local.128.ll | 68 ; GFX9-NEXT: s_lshr_b32 s4, s3, 8 72 ; GFX9-NEXT: s_lshr_b32 s3, s3, 24 75 ; GFX9-NEXT: s_lshr_b32 s3, s2, 8 78 ; GFX9-NEXT: s_lshr_b32 s2, s2, 24 81 ; GFX9-NEXT: s_lshr_b32 s2, s1, 8 84 ; GFX9-NEXT: s_lshr_b32 s1, s1, 24 87 ; GFX9-NEXT: s_lshr_b32 s1, s0, 8 90 ; GFX9-NEXT: s_lshr_b32 s0, s0, 24 110 ; GFX7-NEXT: s_lshr_b32 s4, s3, 8 113 ; GFX7-NEXT: s_lshr_b32 s4, s3, 24 [all …]
|
D | store-local.96.ll | 63 ; GFX9-NEXT: s_lshr_b32 s3, s2, 8 67 ; GFX9-NEXT: s_lshr_b32 s2, s2, 24 70 ; GFX9-NEXT: s_lshr_b32 s2, s1, 8 73 ; GFX9-NEXT: s_lshr_b32 s1, s1, 24 76 ; GFX9-NEXT: s_lshr_b32 s1, s0, 8 79 ; GFX9-NEXT: s_lshr_b32 s0, s0, 24 97 ; GFX7-NEXT: s_lshr_b32 s3, s2, 8 100 ; GFX7-NEXT: s_lshr_b32 s3, s2, 24 103 ; GFX7-NEXT: s_lshr_b32 s2, s2, 16 106 ; GFX7-NEXT: s_lshr_b32 s2, s1, 8 [all …]
|
D | extract_vector_elt-i8.ll | 17 ; SI: s_lshr_b32 s{{[0-9]+}}, s{{[0-9]+}}, 8 34 ; GCN: s_lshr_b32 s{{[0-9]+}}, s{{[0-9]+}}, 16 50 ; GCN: s_lshr_b32 s{{[0-9]+}}, s{{[0-9]+}}, 16 67 ; GCN: s_lshr_b32 s{{[0-9]+}}, [[VAL]], 16 82 ; GCN: s_lshr_b32 [[ELT2:s[0-9]+]], [[LOAD0]], 16 100 ; GCN: s_lshr_b32 [[ELT2:s[0-9]+]], [[VAL]], 16 116 ; GCN: s_lshr_b32 [[ELT2:s[0-9]+]], [[LOAD0]], 16 154 ; VI: s_lshr_b32 [[ELT:s[0-9]+]], [[LOAD]], [[SCALED_IDX]] 169 ; VI: s_lshr_b32 [[EXTRACT:s[0-9]+]], [[VEC4]], [[SCALED_IDX]] 201 ; GCN: s_lshr_b32 s{{[0-9]+}}, s{{[0-9]+}}, 8 [all …]
|
D | idot4u.ll | 34 ; GFX7-NEXT: s_lshr_b32 s5, s5, 24 36 ; GFX7-NEXT: s_lshr_b32 s4, s4, 24 64 ; GFX8-NEXT: s_lshr_b32 s4, s4, 24 66 ; GFX8-NEXT: s_lshr_b32 s3, s3, 24 97 ; GFX9-NODL-NEXT: s_lshr_b32 s4, s4, 24 99 ; GFX9-NODL-NEXT: s_lshr_b32 s3, s3, 24 197 ; GFX7-NEXT: s_lshr_b32 s5, s5, 24 199 ; GFX7-NEXT: s_lshr_b32 s4, s4, 24 229 ; GFX8-NEXT: s_lshr_b32 s2, s2, 24 231 ; GFX8-NEXT: s_lshr_b32 s1, s1, 24 [all …]
|
D | load-constant-i16.ll | 890 ; GCN-NOHSA-SI-NEXT: s_lshr_b32 s4, s2, 16 906 ; GCN-HSA-NEXT: s_lshr_b32 s0, s2, 16 923 ; GCN-NOHSA-VI-NEXT: s_lshr_b32 s0, s2, 16 1038 ; GCN-NOHSA-SI-NEXT: s_lshr_b32 s7, s4, 16 1058 ; GCN-HSA-NEXT: s_lshr_b32 s2, s0, 16 1078 ; GCN-NOHSA-VI-NEXT: s_lshr_b32 s6, s4, 16 1215 ; GCN-NOHSA-SI-NEXT: s_lshr_b32 s6, s5, 16 1216 ; GCN-NOHSA-SI-NEXT: s_lshr_b32 s7, s4, 16 1236 ; GCN-HSA-NEXT: s_lshr_b32 s2, s1, 16 1237 ; GCN-HSA-NEXT: s_lshr_b32 s3, s0, 16 [all …]
|
D | fshl.ll | 23 ; SI-NEXT: s_lshr_b32 s1, s2, 1 37 ; VI-NEXT: s_lshr_b32 s1, s4, 1 55 ; GFX9-NEXT: s_lshr_b32 s1, s4, 1 148 ; SI-NEXT: s_lshr_b32 s3, s3, 1 153 ; SI-NEXT: s_lshr_b32 s1, s2, 1 169 ; VI-NEXT: s_lshr_b32 s7, s5, 1 175 ; VI-NEXT: s_lshr_b32 s1, s4, 1 195 ; GFX9-NEXT: s_lshr_b32 s5, s5, 1 200 ; GFX9-NEXT: s_lshr_b32 s1, s4, 1 307 ; SI-NEXT: s_lshr_b32 s11, s11, 1 [all …]
|
D | idot2.ll | 24 ; GFX7-NEXT: s_lshr_b32 s6, s4, 16 25 ; GFX7-NEXT: s_lshr_b32 s7, s5, 16 49 ; GFX8-NEXT: s_lshr_b32 s3, s3, 16 51 ; GFX8-NEXT: s_lshr_b32 s4, s4, 16 74 ; GFX9-NODL-NEXT: s_lshr_b32 s3, s3, 16 76 ; GFX9-NODL-NEXT: s_lshr_b32 s4, s4, 16 156 ; GFX7-NEXT: s_lshr_b32 s6, s4, 16 160 ; GFX7-NEXT: s_lshr_b32 s7, s5, 16 183 ; GFX8-NEXT: s_lshr_b32 s3, s3, 16 184 ; GFX8-NEXT: s_lshr_b32 s4, s4, 16 [all …]
|
D | llvm.maxnum.f16.ll | 247 ; SI-NEXT: s_lshr_b32 s1, s6, 16 249 ; SI-NEXT: s_lshr_b32 s0, s0, 16 282 ; VI-NEXT: s_lshr_b32 s4, s4, 16 283 ; VI-NEXT: s_lshr_b32 s5, s5, 16 329 ; SI-NEXT: s_lshr_b32 s2, s2, 16 355 ; VI-NEXT: s_lshr_b32 s4, s4, 16 396 ; SI-NEXT: s_lshr_b32 s2, s2, 16 422 ; VI-NEXT: s_lshr_b32 s4, s4, 16 467 ; SI-NEXT: s_lshr_b32 s1, s6, 16 468 ; SI-NEXT: s_lshr_b32 s4, s8, 16 [all …]
|
D | llvm.minnum.f16.ll | 270 ; SI-NEXT: s_lshr_b32 s1, s6, 16 272 ; SI-NEXT: s_lshr_b32 s0, s0, 16 305 ; VI-NEXT: s_lshr_b32 s4, s4, 16 306 ; VI-NEXT: s_lshr_b32 s5, s5, 16 382 ; SI-NEXT: s_lshr_b32 s2, s2, 16 408 ; VI-NEXT: s_lshr_b32 s4, s4, 16 449 ; SI-NEXT: s_lshr_b32 s2, s2, 16 475 ; VI-NEXT: s_lshr_b32 s4, s4, 16 520 ; SI-NEXT: s_lshr_b32 s1, s6, 16 521 ; SI-NEXT: s_lshr_b32 s4, s8, 16 [all …]
|
D | llvm.amdgcn.raw.buffer.store.format.d16.ll | 18 ; UNPACKED-DAG: s_lshr_b32 [[SHR:s[0-9]+]], [[S_DATA]], 16 35 ; UNPACKED-DAG: s_lshr_b32 [[SHR0:s[0-9]+]], s[[S_DATA_0]], 16 60 ; UNPACKED-DAG: s_lshr_b32 [[SHR0:s[0-9]+]], s[[S_DATA_0]], 16 62 ; UNPACKED-DAG: s_lshr_b32 [[SHR1:s[0-9]+]], s[[S_DATA_1]], 16
|
D | llvm.amdgcn.tbuffer.store.d16.ll | 18 ; UNPACKED-DAG: s_lshr_b32 [[SHR:s[0-9]+]], [[S_DATA]], 16 35 ; UNPACKED-DAG: s_lshr_b32 [[SHR0:s[0-9]+]], s[[S_DATA_0]], 16 57 ; UNPACKED-DAG: s_lshr_b32 [[SHR0:s[0-9]+]], s[[S_DATA_0]], 16 59 ; UNPACKED-DAG: s_lshr_b32 [[SHR1:s[0-9]+]], s[[S_DATA_1]], 16
|
D | llvm.amdgcn.raw.tbuffer.store.d16.ll | 21 ; UNPACKED-DAG: s_lshr_b32 [[SHR:s[0-9]+]], [[S_DATA]], 16 39 ; UNPACKED-DAG: s_lshr_b32 [[SHR0:s[0-9]+]], s[[S_DATA_0]], 16 64 ; UNPACKED-DAG: s_lshr_b32 [[SHR0:s[0-9]+]], s[[S_DATA_0]], 16 66 ; UNPACKED-DAG: s_lshr_b32 [[SHR1:s[0-9]+]], s[[S_DATA_1]], 16
|
D | llvm.amdgcn.struct.buffer.store.format.d16.ll | 18 ; UNPACKED-DAG: s_lshr_b32 [[SHR:s[0-9]+]], [[S_DATA]], 16 35 ; UNPACKED-DAG: s_lshr_b32 [[SHR0:s[0-9]+]], s[[S_DATA_0]], 16 60 ; UNPACKED-DAG: s_lshr_b32 [[SHR0:s[0-9]+]], s[[S_DATA_0]], 16 62 ; UNPACKED-DAG: s_lshr_b32 [[SHR1:s[0-9]+]], s[[S_DATA_1]], 16
|
D | idot8u.ll | 25 ; GFX7-NEXT: s_lshr_b32 s7, s6, 28 33 ; GFX7-NEXT: s_lshr_b32 s5, s4, 28 78 ; GFX8-NEXT: s_lshr_b32 s7, s6, 28 86 ; GFX8-NEXT: s_lshr_b32 s3, s2, 28 131 ; GFX9-NEXT: s_lshr_b32 s7, s6, 28 139 ; GFX9-NEXT: s_lshr_b32 s3, s2, 28 299 ; GFX7-NEXT: s_lshr_b32 s6, s4, 28 306 ; GFX7-NEXT: s_lshr_b32 s13, s5, 28 352 ; GFX8-NEXT: s_lshr_b32 s2, s0, 28 359 ; GFX8-NEXT: s_lshr_b32 s9, s1, 28 [all …]
|
D | call-constant.ll | 9 ; SDAG: s_lshr_b32 31 ; SDAG: s_lshr_b32
|