1; RUN: llc < %s -march=x86 -mcpu=core2 -o %t
2; RUN: grep pshufb %t | count 1
3
4; FIXME: the code generated for this test currently contains a superfluous
5;        punpcklqdq before the pshufb. Don't XFAIL the test because of that:
;        the output is still better than what the previous code produced.
6
7; Pack various elements via shuffles.
; shuf1: returns an <8 x i16> built from the two <8 x i16> arguments with a
; single shufflevector. Only the first two result lanes are specified by the
; mask; the remaining six mask entries are undef.
8define <8 x i16> @shuf1(<8 x i16> %T0, <8 x i16> %T1) nounwind readnone {
9entry:
; shufflevector mask indices 0-7 select from the first operand (%T0) and 8-15
; from the second (%T1), so result lane 0 is element 1 of %T0 and result lane 1
; is element 0 of %T1.
10	%tmp7 = shufflevector <8 x i16> %T0, <8 x i16> %T1, <8 x i32> < i32 1, i32 8, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef , i32 undef >
11	ret <8 x i16> %tmp7
12}
13