Lines Matching refs:SI
1 ; RUN: llc -march=amdgcn -mcpu=SI -verify-machineinstrs < %s | FileCheck -check-prefix=SI %s
8 ; SI-LABEL: {{^}}test_div_scale_f32_1:
9 ; SI-DAG: buffer_load_dword [[A:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64
10 ; SI-DAG: buffer_load_dword [[B:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64…
11 ; SI: v_div_scale_f32 [[RESULT0:v[0-9]+]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[B]], [[B]], [[A]]
12 ; SI: buffer_store_dword [[RESULT0]]
13 ; SI: s_endpgm
28 ; SI-LABEL: {{^}}test_div_scale_f32_2:
29 ; SI-DAG: buffer_load_dword [[A:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64
30 ; SI-DAG: buffer_load_dword [[B:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64…
31 ; SI: v_div_scale_f32 [[RESULT0:v[0-9]+]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[A]], [[B]], [[A]]
32 ; SI: buffer_store_dword [[RESULT0]]
33 ; SI: s_endpgm
48 ; SI-LABEL: {{^}}test_div_scale_f64_1:
49 ; SI-DAG: buffer_load_dwordx2 [[A:v\[[0-9]+:[0-9]+\]]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\…
50 ; SI-DAG: buffer_load_dwordx2 [[B:v\[[0-9]+:[0-9]+\]]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\…
51 ; SI: v_div_scale_f64 [[RESULT0:v\[[0-9]+:[0-9]+\]]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[B]], [[B]],…
52 ; SI: buffer_store_dwordx2 [[RESULT0]]
53 ; SI: s_endpgm
68 ; SI-LABEL: {{^}}test_div_scale_f64_2:
69 ; SI-DAG: buffer_load_dwordx2 [[A:v\[[0-9]+:[0-9]+\]]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\…
70 ; SI-DAG: buffer_load_dwordx2 [[B:v\[[0-9]+:[0-9]+\]]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\…
71 ; SI: v_div_scale_f64 [[RESULT0:v\[[0-9]+:[0-9]+\]]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[A]], [[B]],…
72 ; SI: buffer_store_dwordx2 [[RESULT0]]
73 ; SI: s_endpgm
88 ; SI-LABEL: {{^}}test_div_scale_f32_scalar_num_1:
89 ; SI-DAG: buffer_load_dword [[B:v[0-9]+]]
90 ; SI-DAG: s_load_dword [[A:s[0-9]+]]
91 ; SI: v_div_scale_f32 [[RESULT0:v[0-9]+]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[B]], [[B]], [[A]]
92 ; SI: buffer_store_dword [[RESULT0]]
93 ; SI: s_endpgm
106 ; SI-LABEL: {{^}}test_div_scale_f32_scalar_num_2:
107 ; SI-DAG: buffer_load_dword [[B:v[0-9]+]]
108 ; SI-DAG: s_load_dword [[A:s[0-9]+]]
109 ; SI: v_div_scale_f32 [[RESULT0:v[0-9]+]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[A]], [[B]], [[A]]
110 ; SI: buffer_store_dword [[RESULT0]]
111 ; SI: s_endpgm
124 ; SI-LABEL: {{^}}test_div_scale_f32_scalar_den_1:
125 ; SI-DAG: buffer_load_dword [[A:v[0-9]+]]
126 ; SI-DAG: s_load_dword [[B:s[0-9]+]]
127 ; SI: v_div_scale_f32 [[RESULT0:v[0-9]+]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[B]], [[B]], [[A]]
128 ; SI: buffer_store_dword [[RESULT0]]
129 ; SI: s_endpgm
142 ; SI-LABEL: {{^}}test_div_scale_f32_scalar_den_2:
143 ; SI-DAG: buffer_load_dword [[A:v[0-9]+]]
144 ; SI-DAG: s_load_dword [[B:s[0-9]+]]
145 ; SI: v_div_scale_f32 [[RESULT0:v[0-9]+]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[A]], [[B]], [[A]]
146 ; SI: buffer_store_dword [[RESULT0]]
147 ; SI: s_endpgm
160 ; SI-LABEL: {{^}}test_div_scale_f64_scalar_num_1:
161 ; SI-DAG: buffer_load_dwordx2 [[B:v\[[0-9]+:[0-9]+\]]]
162 ; SI-DAG: s_load_dwordx2 [[A:s\[[0-9]+:[0-9]+\]]], {{s\[[0-9]+:[0-9]+\]}}, 0xd
163 ; SI: v_div_scale_f64 [[RESULT0:v\[[0-9]+:[0-9]+\]]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[B]], [[B]],…
164 ; SI: buffer_store_dwordx2 [[RESULT0]]
165 ; SI: s_endpgm
178 ; SI-LABEL: {{^}}test_div_scale_f64_scalar_num_2:
179 ; SI-DAG: s_load_dwordx2 [[A:s\[[0-9]+:[0-9]+\]]], {{s\[[0-9]+:[0-9]+\]}}, 0xd
180 ; SI-DAG: buffer_load_dwordx2 [[B:v\[[0-9]+:[0-9]+\]]]
181 ; SI: v_div_scale_f64 [[RESULT0:v\[[0-9]+:[0-9]+\]]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[A]], [[B]],…
182 ; SI: buffer_store_dwordx2 [[RESULT0]]
183 ; SI: s_endpgm
196 ; SI-LABEL: {{^}}test_div_scale_f64_scalar_den_1:
197 ; SI-DAG: buffer_load_dwordx2 [[A:v\[[0-9]+:[0-9]+\]]]
198 ; SI-DAG: s_load_dwordx2 [[B:s\[[0-9]+:[0-9]+\]]], {{s\[[0-9]+:[0-9]+\]}}, 0xd
199 ; SI: v_div_scale_f64 [[RESULT0:v\[[0-9]+:[0-9]+\]]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[B]], [[B]],…
200 ; SI: buffer_store_dwordx2 [[RESULT0]]
201 ; SI: s_endpgm
214 ; SI-LABEL: {{^}}test_div_scale_f64_scalar_den_2:
215 ; SI-DAG: buffer_load_dwordx2 [[A:v\[[0-9]+:[0-9]+\]]]
216 ; SI-DAG: s_load_dwordx2 [[B:s\[[0-9]+:[0-9]+\]]], {{s\[[0-9]+:[0-9]+\]}}, 0xd
217 ; SI: v_div_scale_f64 [[RESULT0:v\[[0-9]+:[0-9]+\]]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[A]], [[B]],…
218 ; SI: buffer_store_dwordx2 [[RESULT0]]
219 ; SI: s_endpgm
232 ; SI-LABEL: {{^}}test_div_scale_f32_all_scalar_1:
233 ; SI-DAG: s_load_dword [[A:s[0-9]+]], {{s\[[0-9]+:[0-9]+\]}}, 0xb
234 ; SI-DAG: s_load_dword [[B:s[0-9]+]], {{s\[[0-9]+:[0-9]+\]}}, 0xc
235 ; SI: v_mov_b32_e32 [[VA:v[0-9]+]], [[A]]
236 ; SI: v_div_scale_f32 [[RESULT0:v[0-9]+]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[B]], [[B]], [[VA]]
237 ; SI: buffer_store_dword [[RESULT0]]
238 ; SI: s_endpgm
246 ; SI-LABEL: {{^}}test_div_scale_f32_all_scalar_2:
247 ; SI-DAG: s_load_dword [[A:s[0-9]+]], {{s\[[0-9]+:[0-9]+\]}}, 0xb
248 ; SI-DAG: s_load_dword [[B:s[0-9]+]], {{s\[[0-9]+:[0-9]+\]}}, 0xc
249 ; SI: v_mov_b32_e32 [[VB:v[0-9]+]], [[B]]
250 ; SI: v_div_scale_f32 [[RESULT0:v[0-9]+]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[A]], [[VB]], [[A]]
251 ; SI: buffer_store_dword [[RESULT0]]
252 ; SI: s_endpgm
260 ; SI-LABEL: {{^}}test_div_scale_f64_all_scalar_1:
261 ; SI-DAG: s_load_dwordx2 s{{\[}}[[A_LO:[0-9]+]]:[[A_HI:[0-9]+]]{{\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0xb
262 ; SI-DAG: s_load_dwordx2 [[B:s\[[0-9]+:[0-9]+\]]], {{s\[[0-9]+:[0-9]+\]}}, 0xd
263 ; SI-DAG: v_mov_b32_e32 v[[VA_LO:[0-9]+]], s[[A_LO]]
264 ; SI-DAG: v_mov_b32_e32 v[[VA_HI:[0-9]+]], s[[A_HI]]
265 ; SI: v_div_scale_f64 [[RESULT0:v\[[0-9]+:[0-9]+\]]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[B]], [[B]],…
266 ; SI: buffer_store_dwordx2 [[RESULT0]]
267 ; SI: s_endpgm
275 ; SI-LABEL: {{^}}test_div_scale_f64_all_scalar_2:
276 ; SI-DAG: s_load_dwordx2 [[A:s\[[0-9]+:[0-9]+\]]], {{s\[[0-9]+:[0-9]+\]}}, 0xb
277 ; SI-DAG: s_load_dwordx2 s{{\[}}[[B_LO:[0-9]+]]:[[B_HI:[0-9]+]]{{\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0xd
278 ; SI-DAG: v_mov_b32_e32 v[[VB_LO:[0-9]+]], s[[B_LO]]
279 ; SI-DAG: v_mov_b32_e32 v[[VB_HI:[0-9]+]], s[[B_HI]]
280 ; SI: v_div_scale_f64 [[RESULT0:v\[[0-9]+:[0-9]+\]]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[A]], v{{\[}…
281 ; SI: buffer_store_dwordx2 [[RESULT0]]
282 ; SI: s_endpgm
290 ; SI-LABEL: {{^}}test_div_scale_f32_inline_imm_num:
291 ; SI-DAG: buffer_load_dword [[A:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64…
292 ; SI: v_div_scale_f32 [[RESULT0:v[0-9]+]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[A]], [[A]], 1.0
293 ; SI: buffer_store_dword [[RESULT0]]
294 ; SI: s_endpgm
306 ; SI-LABEL: {{^}}test_div_scale_f32_inline_imm_den:
307 ; SI-DAG: buffer_load_dword [[A:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64…
308 ; SI: v_div_scale_f32 [[RESULT0:v[0-9]+]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], 2.0, 2.0, [[A]]
309 ; SI: buffer_store_dword [[RESULT0]]
310 ; SI: s_endpgm
322 ; SI-LABEL: {{^}}test_div_scale_f32_fabs_num:
323 ; SI-DAG: buffer_load_dword [[A:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64
324 ; SI-DAG: buffer_load_dword [[B:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64…
325 ; SI: v_div_scale_f32 [[RESULT0:v[0-9]+]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], [[B]], [[B]], |[[A]]|
326 ; SI: buffer_store_dword [[RESULT0]]
327 ; SI: s_endpgm
344 ; SI-LABEL: {{^}}test_div_scale_f32_fabs_den:
345 ; SI-DAG: buffer_load_dword [[A:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64
346 ; SI-DAG: buffer_load_dword [[B:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64…
347 ; SI: v_div_scale_f32 [[RESULT0:v[0-9]+]], [[RESULT1:s\[[0-9]+:[0-9]+\]]], |[[B]]|, |[[B]]|, [[A]]
348 ; SI: buffer_store_dword [[RESULT0]]
349 ; SI: s_endpgm