1; RUN: llc -march=amdgcn -mcpu=gfx802 -verify-machineinstrs < %s | FileCheck %s
2
3; CHECK: s_waitcnt
4define <2 x i16> @main(<2 x float>) #0 {
5  %2 = bitcast <2 x float> %0 to <4 x i16>
6  %3 = shufflevector <4 x i16> %2, <4 x i16> undef, <2 x i32> <i32 0, i32 undef>
7  %4 = extractelement <4 x i16> %2, i32 0
8  %5 = insertelement <2 x i16> %3, i16 %4, i32 0
9  ret <2 x i16> %5
10}
11
12