xref: /aosp_15_r20/external/llvm/test/CodeGen/X86/vshift-4.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
1*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -march=x86 -mcpu=core2 | FileCheck %s
2*9880d681SAndroid Build Coastguard Worker
3*9880d681SAndroid Build Coastguard Worker; test vector shifts converted to proper SSE2 vector shifts when the shift
4*9880d681SAndroid Build Coastguard Worker; amounts are the same when using a shuffle splat.
5*9880d681SAndroid Build Coastguard Worker
; shift1a: shifts <2 x i64> %val left by an amount vector built by splatting
; element 0 of %sh into both lanes (shuffle mask <0, 0>), then stores the
; result to %dst. Both lanes share one shift amount, so the test expects a
; single packed psllq in the generated code.
define void @shift1a(<2 x i64> %val, <2 x i64>* %dst, <2 x i64> %sh) nounwind {
entry:
; CHECK-LABEL: shift1a:
; CHECK: psllq
  ; Splat lane 0 of %sh so every lane is shifted by the same amount.
  %shamt = shufflevector <2 x i64> %sh, <2 x i64> undef, <2 x i32> <i32 0, i32 0>
  %shl = shl <2 x i64> %val, %shamt
  store <2 x i64> %shl, <2 x i64>* %dst
  ret void
}

; shift1b can't use a single packed shift, but it can shift the lanes
; separately and shuffle the results back together.
; The shuffle mask <0, 1> keeps both lanes of %sh as they are, so the two
; lanes of %val may be shifted by different amounts. The FileCheck directives
; below pin the exact expected sequence: two psllq instructions (one per
; shift amount) followed by a movsd that merges the two results.
define void @shift1b(<2 x i64> %val, <2 x i64>* %dst, <2 x i64> %sh) nounwind {
entry:
; CHECK-LABEL: shift1b:
; CHECK:       pshufd {{.*#+}} xmm2 = xmm1[2,3,0,1]
; CHECK-NEXT:  movdqa %xmm0, %xmm3
; CHECK-NEXT:  psllq  %xmm2, %xmm3
; CHECK-NEXT:  movq   {{.*#+}} xmm1 = xmm1[0],zero
; CHECK-NEXT:  psllq  %xmm1, %xmm0
; CHECK-NEXT:  movsd  {{.*#+}} xmm3 = xmm0[0],xmm3[1]
  ; Identity shuffle: lane 0 and lane 1 of %sh are passed through unchanged.
  %shamt = shufflevector <2 x i64> %sh, <2 x i64> undef, <2 x i32> <i32 0, i32 1>
  %shl = shl <2 x i64> %val, %shamt
  store <2 x i64> %shl, <2 x i64>* %dst
  ret void
}

; shift2a: shifts <4 x i32> %val left by an amount vector built by splatting
; element 1 of the <2 x i32> %amt into all four lanes, then stores the result
; to %dst. All lanes share one shift amount, so the test expects a packed
; pslld in the generated code.
define void @shift2a(<4 x i32> %val, <4 x i32>* %dst, <2 x i32> %amt) nounwind {
entry:
; CHECK-LABEL: shift2a:
; CHECK: pslld
  ; Widening splat: 2-element source, 4-element result, every lane = %amt[1].
  %shamt = shufflevector <2 x i32> %amt, <2 x i32> undef, <4 x i32> <i32 1, i32 1, i32 1, i32 1>
  %shl = shl <4 x i32> %val, %shamt
  store <4 x i32> %shl, <4 x i32>* %dst
  ret void
}

; shift2b: same shape as a full splat of element 1 of %amt, except that lane 1
; of the shuffle mask is undef. The test expects the shift to still be
; lowered to a packed pslld, i.e. the undef lane must not prevent the amount
; vector from being treated as a splat.
define void @shift2b(<4 x i32> %val, <4 x i32>* %dst, <2 x i32> %amt) nounwind {
entry:
; CHECK-LABEL: shift2b:
; CHECK: pslld
  ; Lanes 0, 2 and 3 take %amt[1]; lane 1 is left undefined.
  %shamt = shufflevector <2 x i32> %amt, <2 x i32> undef, <4 x i32> <i32 1, i32 undef, i32 1, i32 1>
  %shl = shl <4 x i32> %val, %shamt
  store <4 x i32> %shl, <4 x i32>* %dst
  ret void
}

; shift2c: shifts <4 x i32> %val left by an amount vector built by splatting
; element 1 of the <2 x i32> %amt into all four lanes, then stores the result
; to %dst. The test expects a packed pslld in the generated code.
; NOTE(review): apart from the function name, this body is identical to
; @shift2a (same <1, 1, 1, 1> mask) -- confirm whether a different shuffle
; mask was intended here.
define void @shift2c(<4 x i32> %val, <4 x i32>* %dst, <2 x i32> %amt) nounwind {
entry:
; CHECK-LABEL: shift2c:
; CHECK: pslld
  ; Widening splat: every lane of the shift amount is %amt[1].
  %shamt = shufflevector <2 x i32> %amt, <2 x i32> undef, <4 x i32> <i32 1, i32 1, i32 1, i32 1>
  %shl = shl <4 x i32> %val, %shamt
  store <4 x i32> %shl, <4 x i32>* %dst
  ret void
}

; shift3a: shifts <8 x i16> %val left by an amount vector built by splatting
; element 6 of %amt into all eight lanes, then stores the result to %dst.
; The test expects a `pextrw $6` (presumably fetching the splatted element,
; since the immediate matches the shuffle index) followed later by a packed
; psllw.
define void @shift3a(<8 x i16> %val, <8 x i16>* %dst, <8 x i16> %amt) nounwind {
entry:
; CHECK-LABEL: shift3a:
; CHECK: pextrw $6
; CHECK: psllw
  ; Splat lane 6 of %amt so every lane is shifted by the same amount.
  %shamt = shufflevector <8 x i16> %amt, <8 x i16> undef, <8 x i32> <i32 6, i32 6, i32 6, i32 6, i32 6, i32 6, i32 6, i32 6>
  %shl = shl <8 x i16> %val, %shamt
  store <8 x i16> %shl, <8 x i16>* %dst
  ret void
}

; shift3b: shifts <8 x i16> %val left by a scalar i16 %amt. The amount vector
; is built without a shuffle: %amt is inserted into each of the eight lanes
; in turn with insertelement. The result is stored to %dst. The test expects
; a movzwl followed later by a packed psllw in the generated code.
define void @shift3b(<8 x i16> %val, <8 x i16>* %dst, i16 %amt) nounwind {
entry:
; CHECK-LABEL: shift3b:
; CHECK: movzwl
; CHECK: psllw
  ; Build the splat lane by lane; after %7 all eight lanes hold %amt.
  %0 = insertelement <8 x i16> undef, i16 %amt, i32 0
  %1 = insertelement <8 x i16> %0, i16 %amt, i32 1
  %2 = insertelement <8 x i16> %1, i16 %amt, i32 2
  %3 = insertelement <8 x i16> %2, i16 %amt, i32 3
  %4 = insertelement <8 x i16> %3, i16 %amt, i32 4
  %5 = insertelement <8 x i16> %4, i16 %amt, i32 5
  %6 = insertelement <8 x i16> %5, i16 %amt, i32 6
  %7 = insertelement <8 x i16> %6, i16 %amt, i32 7
  %shl = shl <8 x i16> %val, %7
  store <8 x i16> %shl, <8 x i16>* %dst
  ret void
}