; RUN: llc < %s -march=x86 -mcpu=core2 | FileCheck %s

; Test that vector shifts are converted to proper SSE2 vector shifts when the
; shift amounts are the same in every lane because they come from a shuffle
; splat (or an equivalent insertelement chain).

; The shuffle mask <0, 0> splats lane 0 of %sh into both lanes, so a single
; packed 64-bit shift is expected.
define void @shift1a(<2 x i64> %val, <2 x i64>* %dst, <2 x i64> %sh) nounwind {
entry:
; CHECK-LABEL: shift1a:
; CHECK: psllq
  %shamt = shufflevector <2 x i64> %sh, <2 x i64> undef, <2 x i32> <i32 0, i32 0>
  %shl = shl <2 x i64> %val, %shamt
  store <2 x i64> %shl, <2 x i64>* %dst
  ret void
}

; shift1b can't use a packed shift but can shift lanes separately and shuffle
; back together. The shuffle mask <0, 1> keeps both lanes of %sh, so the two
; shift amounts are not a splat.
define void @shift1b(<2 x i64> %val, <2 x i64>* %dst, <2 x i64> %sh) nounwind {
entry:
; CHECK-LABEL: shift1b:
; CHECK: pshufd {{.*#+}} xmm2 = xmm1[2,3,0,1]
; CHECK-NEXT: movdqa %xmm0, %xmm3
; CHECK-NEXT: psllq %xmm2, %xmm3
; CHECK-NEXT: movq {{.*#+}} xmm1 = xmm1[0],zero
; CHECK-NEXT: psllq %xmm1, %xmm0
; CHECK-NEXT: movsd {{.*#+}} xmm3 = xmm0[0],xmm3[1]
  %shamt = shufflevector <2 x i64> %sh, <2 x i64> undef, <2 x i32> <i32 0, i32 1>
  %shl = shl <2 x i64> %val, %shamt
  store <2 x i64> %shl, <2 x i64>* %dst
  ret void
}

; Lane 1 of the <2 x i32> %amt is splatted across all four lanes of the shift
; amount; a packed 32-bit shift is expected.
define void @shift2a(<4 x i32> %val, <4 x i32>* %dst, <2 x i32> %amt) nounwind {
entry:
; CHECK-LABEL: shift2a:
; CHECK: pslld
  %shamt = shufflevector <2 x i32> %amt, <2 x i32> undef, <4 x i32> <i32 1, i32 1, i32 1, i32 1>
  %shl = shl <4 x i32> %val, %shamt
  store <4 x i32> %shl, <4 x i32>* %dst
  ret void
}

; Same as shift2a, except that one element of the shuffle mask is undef; a
; packed 32-bit shift is still expected.
define void @shift2b(<4 x i32> %val, <4 x i32>* %dst, <2 x i32> %amt) nounwind {
entry:
; CHECK-LABEL: shift2b:
; CHECK: pslld
  %shamt = shufflevector <2 x i32> %amt, <2 x i32> undef, <4 x i32> <i32 1, i32 undef, i32 1, i32 1>
  %shl = shl <4 x i32> %val, %shamt
  store <4 x i32> %shl, <4 x i32>* %dst
  ret void
}

; Uses the same all-ones-index splat mask as shift2a; a packed 32-bit shift is
; expected.
define void @shift2c(<4 x i32> %val, <4 x i32>* %dst, <2 x i32> %amt) nounwind {
entry:
; CHECK-LABEL: shift2c:
; CHECK: pslld
  %shamt = shufflevector <2 x i32> %amt, <2 x i32> undef, <4 x i32> <i32 1, i32 1, i32 1, i32 1>
  %shl = shl <4 x i32> %val, %shamt
  store <4 x i32> %shl, <4 x i32>* %dst
  ret void
}

; Lane 6 of %amt is splatted across all eight lanes; the checks expect that
; lane to be extracted (pextrw $6) before a packed 16-bit shift.
define void @shift3a(<8 x i16> %val, <8 x i16>* %dst, <8 x i16> %amt) nounwind {
entry:
; CHECK-LABEL: shift3a:
; CHECK: pextrw $6
; CHECK: psllw
  %shamt = shufflevector <8 x i16> %amt, <8 x i16> undef, <8 x i32> <i32 6, i32 6, i32 6, i32 6, i32 6, i32 6, i32 6, i32 6>
  %shl = shl <8 x i16> %val, %shamt
  store <8 x i16> %shl, <8 x i16>* %dst
  ret void
}

; The scalar %amt is inserted into every one of the eight lanes by an
; insertelement chain instead of a shuffle; the checks expect a movzwl
; followed by a packed 16-bit shift.
define void @shift3b(<8 x i16> %val, <8 x i16>* %dst, i16 %amt) nounwind {
entry:
; CHECK-LABEL: shift3b:
; CHECK: movzwl
; CHECK: psllw
  %0 = insertelement <8 x i16> undef, i16 %amt, i32 0
  %1 = insertelement <8 x i16> %0, i16 %amt, i32 1
  %2 = insertelement <8 x i16> %1, i16 %amt, i32 2
  %3 = insertelement <8 x i16> %2, i16 %amt, i32 3
  %4 = insertelement <8 x i16> %3, i16 %amt, i32 4
  %5 = insertelement <8 x i16> %4, i16 %amt, i32 5
  %6 = insertelement <8 x i16> %5, i16 %amt, i32 6
  %7 = insertelement <8 x i16> %6, i16 %amt, i32 7
  %shl = shl <8 x i16> %val, %7
  store <8 x i16> %shl, <8 x i16>* %dst
  ret void
}