; xref: /aosp_15_r20/external/llvm/test/CodeGen/SystemZ/vec-perm-03.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
; Test replications of a scalar memory value, represented as splats.
;
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z13 | FileCheck %s

; Test a v16i8 replicating load with no offset.
; The i8 loaded from %ptr is inserted into element 0 and then broadcast to all
; 16 lanes by a shuffle with an all-zero mask.  The whole sequence is expected
; to be selected as a single VLREPB addressing 0(%r2).
define <16 x i8> @f1(i8 *%ptr) {
; CHECK-LABEL: f1:
; CHECK: vlrepb %v24, 0(%r2)
; CHECK: br %r14
  %scalar = load i8, i8 *%ptr
  %val = insertelement <16 x i8> undef, i8 %scalar, i32 0
  %ret = shufflevector <16 x i8> %val, <16 x i8> undef,
                       <16 x i32> zeroinitializer
  ret <16 x i8> %ret
}

; Test a v16i8 replicating load with the maximum in-range offset.
; The address is %base + 4095 bytes; the expected output folds that offset
; directly into the VLREPB displacement instead of adjusting %r2 first.
define <16 x i8> @f2(i8 *%base) {
; CHECK-LABEL: f2:
; CHECK: vlrepb %v24, 4095(%r2)
; CHECK: br %r14
  %ptr = getelementptr i8, i8 *%base, i64 4095
  %scalar = load i8, i8 *%ptr
  %val = insertelement <16 x i8> undef, i8 %scalar, i32 0
  %ret = shufflevector <16 x i8> %val, <16 x i8> undef,
                       <16 x i32> zeroinitializer
  ret <16 x i8> %ret
}

; Test a v16i8 replicating load with the first out-of-range offset.
; The address is %base + 4096 bytes, one past the largest displacement the
; in-range test uses.  The expected output adds 4096 to %r2 with AGHI and then
; issues VLREPB with a zero displacement.
define <16 x i8> @f3(i8 *%base) {
; CHECK-LABEL: f3:
; CHECK: aghi %r2, 4096
; CHECK: vlrepb %v24, 0(%r2)
; CHECK: br %r14
  %ptr = getelementptr i8, i8 *%base, i64 4096
  %scalar = load i8, i8 *%ptr
  %val = insertelement <16 x i8> undef, i8 %scalar, i32 0
  %ret = shufflevector <16 x i8> %val, <16 x i8> undef,
                       <16 x i32> zeroinitializer
  ret <16 x i8> %ret
}

; Test a v8i16 replicating load with no offset.
; The i16 loaded from %ptr is inserted into element 0 and broadcast to all
; 8 lanes by a zero-mask shuffle; a single VLREPH from 0(%r2) is expected.
define <8 x i16> @f4(i16 *%ptr) {
; CHECK-LABEL: f4:
; CHECK: vlreph %v24, 0(%r2)
; CHECK: br %r14
  %scalar = load i16, i16 *%ptr
  %val = insertelement <8 x i16> undef, i16 %scalar, i32 0
  %ret = shufflevector <8 x i16> %val, <8 x i16> undef,
                       <8 x i32> zeroinitializer
  ret <8 x i16> %ret
}

; Test a v8i16 replicating load with the maximum in-range offset.
; Element index 2047 of an i16 array is byte offset 2047 * 2 = 4094, which the
; expected output folds into the VLREPH displacement.
define <8 x i16> @f5(i16 *%base) {
; CHECK-LABEL: f5:
; CHECK: vlreph %v24, 4094(%r2)
; CHECK: br %r14
  %ptr = getelementptr i16, i16 *%base, i64 2047
  %scalar = load i16, i16 *%ptr
  %val = insertelement <8 x i16> undef, i16 %scalar, i32 0
  %ret = shufflevector <8 x i16> %val, <8 x i16> undef,
                       <8 x i32> zeroinitializer
  ret <8 x i16> %ret
}

; Test a v8i16 replicating load with the first out-of-range offset.
; Element index 2048 of an i16 array is byte offset 2048 * 2 = 4096.  The
; expected output adds 4096 to %r2 with AGHI and then uses VLREPH with a zero
; displacement.
define <8 x i16> @f6(i16 *%base) {
; CHECK-LABEL: f6:
; CHECK: aghi %r2, 4096
; CHECK: vlreph %v24, 0(%r2)
; CHECK: br %r14
  %ptr = getelementptr i16, i16 *%base, i64 2048
  %scalar = load i16, i16 *%ptr
  %val = insertelement <8 x i16> undef, i16 %scalar, i32 0
  %ret = shufflevector <8 x i16> %val, <8 x i16> undef,
                       <8 x i32> zeroinitializer
  ret <8 x i16> %ret
}

; Test a v4i32 replicating load with no offset.
; The i32 loaded from %ptr is inserted into element 0 and broadcast to all
; 4 lanes by a zero-mask shuffle; a single VLREPF from 0(%r2) is expected.
define <4 x i32> @f7(i32 *%ptr) {
; CHECK-LABEL: f7:
; CHECK: vlrepf %v24, 0(%r2)
; CHECK: br %r14
  %scalar = load i32, i32 *%ptr
  %val = insertelement <4 x i32> undef, i32 %scalar, i32 0
  %ret = shufflevector <4 x i32> %val, <4 x i32> undef,
                       <4 x i32> zeroinitializer
  ret <4 x i32> %ret
}

; Test a v4i32 replicating load with the maximum in-range offset.
; Element index 1023 of an i32 array is byte offset 1023 * 4 = 4092, which the
; expected output folds into the VLREPF displacement.
define <4 x i32> @f8(i32 *%base) {
; CHECK-LABEL: f8:
; CHECK: vlrepf %v24, 4092(%r2)
; CHECK: br %r14
  %ptr = getelementptr i32, i32 *%base, i64 1023
  %scalar = load i32, i32 *%ptr
  %val = insertelement <4 x i32> undef, i32 %scalar, i32 0
  %ret = shufflevector <4 x i32> %val, <4 x i32> undef,
                       <4 x i32> zeroinitializer
  ret <4 x i32> %ret
}

; Test a v4i32 replicating load with the first out-of-range offset.
; Element index 1024 of an i32 array is byte offset 1024 * 4 = 4096.  The
; expected output adds 4096 to %r2 with AGHI and then uses VLREPF with a zero
; displacement.
define <4 x i32> @f9(i32 *%base) {
; CHECK-LABEL: f9:
; CHECK: aghi %r2, 4096
; CHECK: vlrepf %v24, 0(%r2)
; CHECK: br %r14
  %ptr = getelementptr i32, i32 *%base, i64 1024
  %scalar = load i32, i32 *%ptr
  %val = insertelement <4 x i32> undef, i32 %scalar, i32 0
  %ret = shufflevector <4 x i32> %val, <4 x i32> undef,
                       <4 x i32> zeroinitializer
  ret <4 x i32> %ret
}

; Test a v2i64 replicating load with no offset.
; The i64 loaded from %ptr is inserted into element 0 and broadcast to both
; lanes by a zero-mask shuffle; a single VLREPG from 0(%r2) is expected.
define <2 x i64> @f10(i64 *%ptr) {
; CHECK-LABEL: f10:
; CHECK: vlrepg %v24, 0(%r2)
; CHECK: br %r14
  %scalar = load i64, i64 *%ptr
  %val = insertelement <2 x i64> undef, i64 %scalar, i32 0
  %ret = shufflevector <2 x i64> %val, <2 x i64> undef,
                       <2 x i32> zeroinitializer
  ret <2 x i64> %ret
}

; Test a v2i64 replicating load with the maximum in-range offset.
; Element index 511 of an i64 array is byte offset 511 * 8 = 4088, which the
; expected output folds into the VLREPG displacement.
define <2 x i64> @f11(i64 *%base) {
; CHECK-LABEL: f11:
; CHECK: vlrepg %v24, 4088(%r2)
; CHECK: br %r14
  %ptr = getelementptr i64, i64 *%base, i64 511
  %scalar = load i64, i64 *%ptr
  %val = insertelement <2 x i64> undef, i64 %scalar, i32 0
  %ret = shufflevector <2 x i64> %val, <2 x i64> undef,
                       <2 x i32> zeroinitializer
  ret <2 x i64> %ret
}

; Test a v2i64 replicating load with the first out-of-range offset.
; Element index 512 of an i64 array is byte offset 512 * 8 = 4096.  The
; expected output adds 4096 to %r2 with AGHI and then uses VLREPG with a zero
; displacement.
define <2 x i64> @f12(i64 *%base) {
; CHECK-LABEL: f12:
; CHECK: aghi %r2, 4096
; CHECK: vlrepg %v24, 0(%r2)
; CHECK: br %r14
  %ptr = getelementptr i64, i64 *%base, i64 512
  %scalar = load i64, i64 *%ptr
  %val = insertelement <2 x i64> undef, i64 %scalar, i32 0
  %ret = shufflevector <2 x i64> %val, <2 x i64> undef,
                       <2 x i32> zeroinitializer
  ret <2 x i64> %ret
}

; Test a v4f32 replicating load with no offset.
; The float loaded from %ptr is inserted into element 0 and broadcast to all
; 4 lanes by a zero-mask shuffle.  The expected instruction is VLREPF, the
; same word-sized replicating load the v4i32 tests in this file expect.
define <4 x float> @f13(float *%ptr) {
; CHECK-LABEL: f13:
; CHECK: vlrepf %v24, 0(%r2)
; CHECK: br %r14
  %scalar = load float, float *%ptr
  %val = insertelement <4 x float> undef, float %scalar, i32 0
  %ret = shufflevector <4 x float> %val, <4 x float> undef,
                       <4 x i32> zeroinitializer
  ret <4 x float> %ret
}

; Test a v4f32 replicating load with the maximum in-range offset.
; Element index 1023 of a float array is byte offset 1023 * 4 = 4092, which
; the expected output folds into the VLREPF displacement.
define <4 x float> @f14(float *%base) {
; CHECK-LABEL: f14:
; CHECK: vlrepf %v24, 4092(%r2)
; CHECK: br %r14
  %ptr = getelementptr float, float *%base, i64 1023
  %scalar = load float, float *%ptr
  %val = insertelement <4 x float> undef, float %scalar, i32 0
  %ret = shufflevector <4 x float> %val, <4 x float> undef,
                       <4 x i32> zeroinitializer
  ret <4 x float> %ret
}

; Test a v4f32 replicating load with the first out-of-range offset.
; Element index 1024 of a float array is byte offset 1024 * 4 = 4096.  The
; expected output adds 4096 to %r2 with AGHI and then uses VLREPF with a zero
; displacement.
define <4 x float> @f15(float *%base) {
; CHECK-LABEL: f15:
; CHECK: aghi %r2, 4096
; CHECK: vlrepf %v24, 0(%r2)
; CHECK: br %r14
  %ptr = getelementptr float, float *%base, i64 1024
  %scalar = load float, float *%ptr
  %val = insertelement <4 x float> undef, float %scalar, i32 0
  %ret = shufflevector <4 x float> %val, <4 x float> undef,
                       <4 x i32> zeroinitializer
  ret <4 x float> %ret
}

; Test a v2f64 replicating load with no offset.
; The double loaded from %ptr is inserted into element 0 and broadcast to both
; lanes by a zero-mask shuffle.  The expected instruction is VLREPG, the same
; doubleword-sized replicating load the v2i64 tests in this file expect.
define <2 x double> @f16(double *%ptr) {
; CHECK-LABEL: f16:
; CHECK: vlrepg %v24, 0(%r2)
; CHECK: br %r14
  %scalar = load double, double *%ptr
  %val = insertelement <2 x double> undef, double %scalar, i32 0
  %ret = shufflevector <2 x double> %val, <2 x double> undef,
                       <2 x i32> zeroinitializer
  ret <2 x double> %ret
}

; Test a v2f64 replicating load with the maximum in-range offset.
; Element index 511 of a double array is byte offset 511 * 8 = 4088, which the
; expected output folds into the VLREPG displacement.
define <2 x double> @f17(double *%base) {
; CHECK-LABEL: f17:
; CHECK: vlrepg %v24, 4088(%r2)
; CHECK: br %r14
  %ptr = getelementptr double, double *%base, i64 511
  %scalar = load double, double *%ptr
  %val = insertelement <2 x double> undef, double %scalar, i32 0
  %ret = shufflevector <2 x double> %val, <2 x double> undef,
                       <2 x i32> zeroinitializer
  ret <2 x double> %ret
}

; Test a v2f64 replicating load with the first out-of-range offset.
; Element index 512 of a double array is byte offset 512 * 8 = 4096.  The
; expected output adds 4096 to %r2 with AGHI and then uses VLREPG with a zero
; displacement.
define <2 x double> @f18(double *%base) {
; CHECK-LABEL: f18:
; CHECK: aghi %r2, 4096
; CHECK: vlrepg %v24, 0(%r2)
; CHECK: br %r14
  %ptr = getelementptr double, double *%base, i64 512
  %scalar = load double, double *%ptr
  %val = insertelement <2 x double> undef, double %scalar, i32 0
  %ret = shufflevector <2 x double> %val, <2 x double> undef,
                       <2 x i32> zeroinitializer
  ret <2 x double> %ret
}

; Test a v16i8 replicating load with an index.
; The address is %base + %index + 1023.  The expected output uses one VLREPB
; whose address combines displacement 1023 with both argument registers
; (%index arrives in %r3 and %base in %r2), with no separate address
; arithmetic.
define <16 x i8> @f19(i8 *%base, i64 %index) {
; CHECK-LABEL: f19:
; CHECK: vlrepb %v24, 1023(%r3,%r2)
; CHECK: br %r14
  %ptr1 = getelementptr i8, i8 *%base, i64 %index
  %ptr = getelementptr i8, i8 *%ptr1, i64 1023
  %scalar = load i8, i8 *%ptr
  %val = insertelement <16 x i8> undef, i8 %scalar, i32 0
  %ret = shufflevector <16 x i8> %val, <16 x i8> undef,
                       <16 x i32> zeroinitializer
  ret <16 x i8> %ret
}
