xref: /aosp_15_r20/external/clang/test/CodeGen/x86_64-arguments.c (revision 67e74705e28f6214e480b399dd47ea732279e315)
1*67e74705SXin Li // RUN: %clang_cc1 -triple x86_64-unknown-unknown -emit-llvm -o - %s | \
2*67e74705SXin Li // RUN:   FileCheck %s -check-prefix=CHECK -check-prefix=SSE -check-prefix=NO-AVX512
3*67e74705SXin Li // RUN: %clang_cc1 -triple x86_64-unknown-unknown -emit-llvm -o - %s -target-feature +avx | \
4*67e74705SXin Li // RUN:   FileCheck %s -check-prefix=CHECK -check-prefix=AVX -check-prefix=NO-AVX512
5*67e74705SXin Li // RUN: %clang_cc1 -triple x86_64-unknown-unknown -emit-llvm -o - %s -target-feature +avx512f | \
6*67e74705SXin Li // RUN:   FileCheck %s -check-prefix=CHECK -check-prefix=AVX -check-prefix=AVX512
7*67e74705SXin Li #include <stdarg.h>
8*67e74705SXin Li 
9*67e74705SXin Li // CHECK-LABEL: define signext i8 @f0()
f0(void)10*67e74705SXin Li char f0(void) {
11*67e74705SXin Li   return 0;
12*67e74705SXin Li }
13*67e74705SXin Li 
14*67e74705SXin Li // CHECK-LABEL: define signext i16 @f1()
f1(void)15*67e74705SXin Li short f1(void) {
16*67e74705SXin Li   return 0;
17*67e74705SXin Li }
18*67e74705SXin Li 
19*67e74705SXin Li // CHECK-LABEL: define i32 @f2()
f2(void)20*67e74705SXin Li int f2(void) {
21*67e74705SXin Li   return 0;
22*67e74705SXin Li }
23*67e74705SXin Li 
24*67e74705SXin Li // CHECK-LABEL: define float @f3()
f3(void)25*67e74705SXin Li float f3(void) {
26*67e74705SXin Li   return 0;
27*67e74705SXin Li }
28*67e74705SXin Li 
29*67e74705SXin Li // CHECK-LABEL: define double @f4()
f4(void)30*67e74705SXin Li double f4(void) {
31*67e74705SXin Li   return 0;
32*67e74705SXin Li }
33*67e74705SXin Li 
34*67e74705SXin Li // CHECK-LABEL: define x86_fp80 @f5()
f5(void)35*67e74705SXin Li long double f5(void) {
36*67e74705SXin Li   return 0;
37*67e74705SXin Li }
38*67e74705SXin Li 
39*67e74705SXin Li // CHECK-LABEL: define void @f6(i8 signext %a0, i16 signext %a1, i32 %a2, i64 %a3, i8* %a4)
f6(char a0,short a1,int a2,long long a3,void * a4)40*67e74705SXin Li void f6(char a0, short a1, int a2, long long a3, void *a4) {
41*67e74705SXin Li }
42*67e74705SXin Li 
43*67e74705SXin Li // CHECK-LABEL: define void @f7(i32 %a0)
44*67e74705SXin Li typedef enum { A, B, C } e7;
f7(e7 a0)45*67e74705SXin Li void f7(e7 a0) {
46*67e74705SXin Li }
47*67e74705SXin Li 
48*67e74705SXin Li // Test merging/passing of upper eightbyte with X87 class.
49*67e74705SXin Li //
50*67e74705SXin Li // CHECK-LABEL: define void @f8_1(%union.u8* noalias sret %agg.result)
51*67e74705SXin Li // CHECK-LABEL: define void @f8_2(%union.u8* byval align 16 %a0)
52*67e74705SXin Li union u8 {
53*67e74705SXin Li   long double a;
54*67e74705SXin Li   int b;
55*67e74705SXin Li };
f8_1()56*67e74705SXin Li union u8 f8_1() { while (1) {} }
f8_2(union u8 a0)57*67e74705SXin Li void f8_2(union u8 a0) {}
58*67e74705SXin Li 
59*67e74705SXin Li // CHECK-LABEL: define i64 @f9()
f9(void)60*67e74705SXin Li struct s9 { int a; int b; int : 0; } f9(void) { while (1) {} }
61*67e74705SXin Li 
62*67e74705SXin Li // CHECK-LABEL: define void @f10(i64 %a0.coerce)
63*67e74705SXin Li struct s10 { int a; int b; int : 0; };
f10(struct s10 a0)64*67e74705SXin Li void f10(struct s10 a0) {}
65*67e74705SXin Li 
66*67e74705SXin Li // CHECK-LABEL: define void @f11(%union.anon* noalias sret %agg.result)
f11()67*67e74705SXin Li union { long double a; float b; } f11() { while (1) {} }
68*67e74705SXin Li 
69*67e74705SXin Li // CHECK-LABEL: define i32 @f12_0()
70*67e74705SXin Li // CHECK-LABEL: define void @f12_1(i32 %a0.coerce)
71*67e74705SXin Li struct s12 { int a __attribute__((aligned(16))); };
f12_0(void)72*67e74705SXin Li struct s12 f12_0(void) { while (1) {} }
f12_1(struct s12 a0)73*67e74705SXin Li void f12_1(struct s12 a0) {}
74*67e74705SXin Li 
75*67e74705SXin Li // Check that sret parameter is accounted for when checking available integer
76*67e74705SXin Li // registers.
77*67e74705SXin Li // CHECK: define void @f13(%struct.s13_0* noalias sret %agg.result, i32 %a, i32 %b, i32 %c, i32 %d, {{.*}}* byval align 8 %e, i32 %f)
78*67e74705SXin Li 
79*67e74705SXin Li struct s13_0 { long long f0[3]; };
80*67e74705SXin Li struct s13_1 { long long f0[2]; };
f13(int a,int b,int c,int d,struct s13_1 e,int f)81*67e74705SXin Li struct s13_0 f13(int a, int b, int c, int d,
82*67e74705SXin Li                  struct s13_1 e, int f) { while (1) {} }
83*67e74705SXin Li 
84*67e74705SXin Li // CHECK: define void @f14({{.*}}, i8 signext %X)
f14(int a,int b,int c,int d,int e,int f,char X)85*67e74705SXin Li void f14(int a, int b, int c, int d, int e, int f, char X) {}
86*67e74705SXin Li 
87*67e74705SXin Li // CHECK: define void @f15({{.*}}, i8* %X)
f15(int a,int b,int c,int d,int e,int f,void * X)88*67e74705SXin Li void f15(int a, int b, int c, int d, int e, int f, void *X) {}
89*67e74705SXin Li 
90*67e74705SXin Li // CHECK: define void @f16({{.*}}, float %X)
f16(float a,float b,float c,float d,float e,float f,float g,float h,float X)91*67e74705SXin Li void f16(float a, float b, float c, float d, float e, float f, float g, float h,
92*67e74705SXin Li          float X) {}
93*67e74705SXin Li 
94*67e74705SXin Li // CHECK: define void @f17({{.*}}, x86_fp80 %X)
f17(float a,float b,float c,float d,float e,float f,float g,float h,long double X)95*67e74705SXin Li void f17(float a, float b, float c, float d, float e, float f, float g, float h,
96*67e74705SXin Li          long double X) {}
97*67e74705SXin Li 
98*67e74705SXin Li // Check for valid coercion.  The struct should be passed/returned as i32, not
99*67e74705SXin Li // as i64 for better code quality.
100*67e74705SXin Li // rdar://8135035
101*67e74705SXin Li // CHECK-LABEL: define void @f18(i32 %a, i32 %f18_arg1.coerce)
102*67e74705SXin Li struct f18_s0 { int f0; };
f18(int a,struct f18_s0 f18_arg1)103*67e74705SXin Li void f18(int a, struct f18_s0 f18_arg1) { while (1) {} }
104*67e74705SXin Li 
105*67e74705SXin Li // Check byval alignment.
106*67e74705SXin Li 
107*67e74705SXin Li // CHECK-LABEL: define void @f19(%struct.s19* byval align 16 %x)
108*67e74705SXin Li struct s19 {
109*67e74705SXin Li   long double a;
110*67e74705SXin Li };
f19(struct s19 x)111*67e74705SXin Li void f19(struct s19 x) {}
112*67e74705SXin Li 
113*67e74705SXin Li // CHECK-LABEL: define void @f20(%struct.s20* byval align 32 %x)
114*67e74705SXin Li struct __attribute__((aligned(32))) s20 {
115*67e74705SXin Li   int x;
116*67e74705SXin Li   int y;
117*67e74705SXin Li };
f20(struct s20 x)118*67e74705SXin Li void f20(struct s20 x) {}
119*67e74705SXin Li 
120*67e74705SXin Li struct StringRef {
121*67e74705SXin Li   long x;
122*67e74705SXin Li   const char *Ptr;
123*67e74705SXin Li };
124*67e74705SXin Li 
125*67e74705SXin Li // rdar://7375902
126*67e74705SXin Li // CHECK-LABEL: define i8* @f21(i64 %S.coerce0, i8* %S.coerce1)
f21(struct StringRef S)127*67e74705SXin Li const char *f21(struct StringRef S) { return S.x+S.Ptr; }
128*67e74705SXin Li 
129*67e74705SXin Li // PR7567
130*67e74705SXin Li typedef __attribute__ ((aligned(16))) struct f22s { unsigned long long x[2]; } L;
f22(L x,L y)131*67e74705SXin Li void f22(L x, L y) { }
132*67e74705SXin Li // CHECK: @f22
133*67e74705SXin Li // CHECK: %x = alloca{{.*}}, align 16
134*67e74705SXin Li // CHECK: %y = alloca{{.*}}, align 16
135*67e74705SXin Li 
136*67e74705SXin Li 
137*67e74705SXin Li 
138*67e74705SXin Li // PR7714
139*67e74705SXin Li struct f23S {
140*67e74705SXin Li   short f0;
141*67e74705SXin Li   unsigned f1;
142*67e74705SXin Li   int f2;
143*67e74705SXin Li };
144*67e74705SXin Li 
145*67e74705SXin Li 
f23(int A,struct f23S B)146*67e74705SXin Li void f23(int A, struct f23S B) {
147*67e74705SXin Li   // CHECK-LABEL: define void @f23(i32 %A, i64 %B.coerce0, i32 %B.coerce1)
148*67e74705SXin Li }
149*67e74705SXin Li 
150*67e74705SXin Li struct f24s { long a; int b; };
151*67e74705SXin Li 
f24(struct f23S * X,struct f24s * P2)152*67e74705SXin Li struct f23S f24(struct f23S *X, struct f24s *P2) {
153*67e74705SXin Li   return *X;
154*67e74705SXin Li 
155*67e74705SXin Li   // CHECK: define { i64, i32 } @f24(%struct.f23S* %X, %struct.f24s* %P2)
156*67e74705SXin Li }
157*67e74705SXin Li 
158*67e74705SXin Li // rdar://8248065
159*67e74705SXin Li typedef float v4f32 __attribute__((__vector_size__(16)));
f25(v4f32 X)160*67e74705SXin Li v4f32 f25(v4f32 X) {
161*67e74705SXin Li   // CHECK-LABEL: define <4 x float> @f25(<4 x float> %X)
162*67e74705SXin Li   // CHECK-NOT: alloca
163*67e74705SXin Li   // CHECK: alloca <4 x float>
164*67e74705SXin Li   // CHECK-NOT: alloca
165*67e74705SXin Li   // CHECK: store <4 x float> %X, <4 x float>*
166*67e74705SXin Li   // CHECK-NOT: store
167*67e74705SXin Li   // CHECK: ret <4 x float>
168*67e74705SXin Li   return X+X;
169*67e74705SXin Li }
170*67e74705SXin Li 
171*67e74705SXin Li struct foo26 {
172*67e74705SXin Li   int *X;
173*67e74705SXin Li   float *Y;
174*67e74705SXin Li };
175*67e74705SXin Li 
f26(struct foo26 * P)176*67e74705SXin Li struct foo26 f26(struct foo26 *P) {
177*67e74705SXin Li   // CHECK: define { i32*, float* } @f26(%struct.foo26* %P)
178*67e74705SXin Li   return *P;
179*67e74705SXin Li }
180*67e74705SXin Li 
181*67e74705SXin Li 
182*67e74705SXin Li struct v4f32wrapper {
183*67e74705SXin Li   v4f32 v;
184*67e74705SXin Li };
185*67e74705SXin Li 
f27(struct v4f32wrapper X)186*67e74705SXin Li struct v4f32wrapper f27(struct v4f32wrapper X) {
187*67e74705SXin Li   // CHECK-LABEL: define <4 x float> @f27(<4 x float> %X.coerce)
188*67e74705SXin Li   return X;
189*67e74705SXin Li }
190*67e74705SXin Li 
191*67e74705SXin Li // PR22563 - We should unwrap simple structs and arrays to pass
192*67e74705SXin Li // and return them in the appropriate vector registers if possible.
193*67e74705SXin Li 
194*67e74705SXin Li typedef float v8f32 __attribute__((__vector_size__(32)));
195*67e74705SXin Li struct v8f32wrapper {
196*67e74705SXin Li   v8f32 v;
197*67e74705SXin Li };
198*67e74705SXin Li 
f27a(struct v8f32wrapper X)199*67e74705SXin Li struct v8f32wrapper f27a(struct v8f32wrapper X) {
200*67e74705SXin Li   // AVX-LABEL: define <8 x float> @f27a(<8 x float> %X.coerce)
201*67e74705SXin Li   return X;
202*67e74705SXin Li }
203*67e74705SXin Li 
204*67e74705SXin Li struct v8f32wrapper_wrapper {
205*67e74705SXin Li   v8f32 v[1];
206*67e74705SXin Li };
207*67e74705SXin Li 
f27b(struct v8f32wrapper_wrapper X)208*67e74705SXin Li struct v8f32wrapper_wrapper f27b(struct v8f32wrapper_wrapper X) {
209*67e74705SXin Li   // AVX-LABEL: define <8 x float> @f27b(<8 x float> %X.coerce)
210*67e74705SXin Li   return X;
211*67e74705SXin Li }
212*67e74705SXin Li 
213*67e74705SXin Li // rdar://5711709
214*67e74705SXin Li struct f28c {
215*67e74705SXin Li   double x;
216*67e74705SXin Li   int y;
217*67e74705SXin Li };
f28(struct f28c C)218*67e74705SXin Li void f28(struct f28c C) {
219*67e74705SXin Li   // CHECK-LABEL: define void @f28(double %C.coerce0, i32 %C.coerce1)
220*67e74705SXin Li }
221*67e74705SXin Li 
222*67e74705SXin Li struct f29a {
223*67e74705SXin Li   struct c {
224*67e74705SXin Li     double x;
225*67e74705SXin Li     int y;
226*67e74705SXin Li   } x[1];
227*67e74705SXin Li };
228*67e74705SXin Li 
f29a(struct f29a A)229*67e74705SXin Li void f29a(struct f29a A) {
230*67e74705SXin Li   // CHECK-LABEL: define void @f29a(double %A.coerce0, i32 %A.coerce1)
231*67e74705SXin Li }
232*67e74705SXin Li 
233*67e74705SXin Li // rdar://8249586
234*67e74705SXin Li struct S0 { char f0[8]; char f2; char f3; char f4; };
f30(struct S0 p_4)235*67e74705SXin Li void f30(struct S0 p_4) {
236*67e74705SXin Li   // CHECK-LABEL: define void @f30(i64 %p_4.coerce0, i24 %p_4.coerce1)
237*67e74705SXin Li }
238*67e74705SXin Li 
239*67e74705SXin Li // Pass the third element as a float when followed by tail padding.
240*67e74705SXin Li // rdar://8251384
241*67e74705SXin Li struct f31foo { float a, b, c; };
f31(struct f31foo X)242*67e74705SXin Li float f31(struct f31foo X) {
243*67e74705SXin Li   // CHECK-LABEL: define float @f31(<2 x float> %X.coerce0, float %X.coerce1)
244*67e74705SXin Li   return X.c;
245*67e74705SXin Li }
246*67e74705SXin Li 
f32(_Complex float A,_Complex float B)247*67e74705SXin Li _Complex float f32(_Complex float A, _Complex float B) {
248*67e74705SXin Li   // rdar://6379669
249*67e74705SXin Li   // CHECK-LABEL: define <2 x float> @f32(<2 x float> %A.coerce, <2 x float> %B.coerce)
250*67e74705SXin Li   return A+B;
251*67e74705SXin Li }
252*67e74705SXin Li 
253*67e74705SXin Li 
254*67e74705SXin Li // rdar://8357396
255*67e74705SXin Li struct f33s { long x; float c,d; };
256*67e74705SXin Li 
// Reads one `struct f33s` from the va_list and discards the result.
// No FileCheck expectations are attached to this function in the visible
// source; presumably it only has to get through codegen without crashing
// (see the radar referenced above the struct) -- TODO confirm.
f33(va_list X)257*67e74705SXin Li void f33(va_list X) {
258*67e74705SXin Li   va_arg(X, struct f33s);
259*67e74705SXin Li }
260*67e74705SXin Li 
261*67e74705SXin Li typedef unsigned long long v1i64 __attribute__((__vector_size__(8)));
262*67e74705SXin Li 
263*67e74705SXin Li // rdar://8359248
264*67e74705SXin Li // CHECK-LABEL: define double @f34(double %arg.coerce)
f34(v1i64 arg)265*67e74705SXin Li v1i64 f34(v1i64 arg) { return arg; }
266*67e74705SXin Li 
267*67e74705SXin Li 
268*67e74705SXin Li // rdar://8358475
269*67e74705SXin Li // CHECK-LABEL: define double @f35(double %arg.coerce)
270*67e74705SXin Li typedef unsigned long v1i64_2 __attribute__((__vector_size__(8)));
f35(v1i64_2 arg)271*67e74705SXin Li v1i64_2 f35(v1i64_2 arg) { return arg+arg; }
272*67e74705SXin Li 
273*67e74705SXin Li // rdar://9122143
274*67e74705SXin Li // CHECK: declare void @func(%struct._str* byval align 16)
275*67e74705SXin Li typedef struct _str {
276*67e74705SXin Li   union {
277*67e74705SXin Li     long double a;
278*67e74705SXin Li     long c;
279*67e74705SXin Li   };
280*67e74705SXin Li } str;
281*67e74705SXin Li 
282*67e74705SXin Li void func(str s);
283*67e74705SXin Li str ss;
// Passes the file-scope object `ss` to `func` by value. `func` is declared
// but not defined in this file; presumably this call is what causes its
// declaration to show up in the emitted IR -- TODO confirm.
f9122143()284*67e74705SXin Li void f9122143()
285*67e74705SXin Li {
286*67e74705SXin Li   func(ss);
287*67e74705SXin Li }
288*67e74705SXin Li 
289*67e74705SXin Li // CHECK-LABEL: define double @f36(double %arg.coerce)
290*67e74705SXin Li typedef unsigned v2i32 __attribute((__vector_size__(8)));
f36(v2i32 arg)291*67e74705SXin Li v2i32 f36(v2i32 arg) { return arg; }
292*67e74705SXin Li 
293*67e74705SXin Li // AVX: declare void @f38(<8 x float>)
294*67e74705SXin Li // AVX: declare void @f37(<8 x float>)
295*67e74705SXin Li // SSE: declare void @f38(%struct.s256* byval align 32)
296*67e74705SXin Li // SSE: declare void @f37(<8 x float>* byval align 32)
297*67e74705SXin Li typedef float __m256 __attribute__ ((__vector_size__ (32)));
298*67e74705SXin Li typedef struct {
299*67e74705SXin Li   __m256 m;
300*67e74705SXin Li } s256;
301*67e74705SXin Li 
302*67e74705SXin Li s256 x38;
303*67e74705SXin Li __m256 x37;
304*67e74705SXin Li 
305*67e74705SXin Li void f38(s256 x);
306*67e74705SXin Li void f37(__m256 x);
// Calls f38 and then f37 with the file-scope objects x38 and x37. Both
// callees are declared but not defined in this file; presumably these calls
// are what make their declarations appear in the emitted IR -- TODO confirm.
f39()307*67e74705SXin Li void f39() { f38(x38); f37(x37); }
308*67e74705SXin Li 
309*67e74705SXin Li // The next two tests make sure that the struct below is passed
310*67e74705SXin Li // in the same way regardless of whether AVX is used.
311*67e74705SXin Li 
312*67e74705SXin Li // CHECK: declare void @func40(%struct.t128* byval align 16)
313*67e74705SXin Li typedef float __m128 __attribute__ ((__vector_size__ (16)));
314*67e74705SXin Li typedef struct t128 {
315*67e74705SXin Li   __m128 m;
316*67e74705SXin Li   __m128 n;
317*67e74705SXin Li } two128;
318*67e74705SXin Li 
319*67e74705SXin Li extern void func40(two128 s);
func41(two128 s)320*67e74705SXin Li void func41(two128 s) {
321*67e74705SXin Li   func40(s);
322*67e74705SXin Li }
323*67e74705SXin Li 
324*67e74705SXin Li // CHECK: declare void @func42(%struct.t128_2* byval align 16)
325*67e74705SXin Li typedef struct xxx {
326*67e74705SXin Li   __m128 array[2];
327*67e74705SXin Li } Atwo128;
328*67e74705SXin Li typedef struct t128_2 {
329*67e74705SXin Li   Atwo128 x;
330*67e74705SXin Li } SA;
331*67e74705SXin Li 
332*67e74705SXin Li extern void func42(SA s);
func43(SA s)333*67e74705SXin Li void func43(SA s) {
334*67e74705SXin Li   func42(s);
335*67e74705SXin Li }
336*67e74705SXin Li 
337*67e74705SXin Li // CHECK-LABEL: define i32 @f44
338*67e74705SXin Li // CHECK: ptrtoint
339*67e74705SXin Li // CHECK-NEXT: add i64 %{{[0-9]+}}, 31
340*67e74705SXin Li // CHECK-NEXT: and i64 %{{[0-9]+}}, -32
341*67e74705SXin Li // CHECK-NEXT: inttoptr
// T44 is a 32-byte vector of int; s44 wraps it together with a trailing int.
342*67e74705SXin Li typedef int T44 __attribute((vector_size(32)));
343*67e74705SXin Li struct s44 { T44 x; int y; };
// Fetches one `struct s44` from the variadic arguments and returns its `y`
// member. The expectations preceding the typedef look for "add ..., 31"
// followed by "and ..., -32" on a pointer converted to an integer, i.e. an
// address rounded up to a multiple of 32. Presumably that is the va_arg
// memory pointer being aligned for the 32-byte vector member -- TODO confirm.
f44(int i,...)344*67e74705SXin Li int f44(int i, ...) {
345*67e74705SXin Li   __builtin_va_list ap;
346*67e74705SXin Li   __builtin_va_start(ap, i);
347*67e74705SXin Li   struct s44 s = __builtin_va_arg(ap, struct s44);
348*67e74705SXin Li   __builtin_va_end(ap);
349*67e74705SXin Li   return s.y;
350*67e74705SXin Li }
351*67e74705SXin Li 
352*67e74705SXin Li // Test that vec3 returns the correct LLVM IR type.
353*67e74705SXin Li // AVX-LABEL: define i32 @foo(<3 x i64> %X)
354*67e74705SXin Li typedef long long3 __attribute((ext_vector_type(3)));
foo(long3 X)355*67e74705SXin Li int foo(long3 X)
356*67e74705SXin Li {
357*67e74705SXin Li   return 0;
358*67e74705SXin Li }
359*67e74705SXin Li 
360*67e74705SXin Li // Make sure we don't use a varargs convention for a function without a
361*67e74705SXin Li // prototype where AVX types are involved.
362*67e74705SXin Li // AVX: @test45
363*67e74705SXin Li // AVX: call i32 bitcast (i32 (...)* @f45 to i32 (<8 x float>)*)
364*67e74705SXin Li int f45();
365*67e74705SXin Li __m256 x45;
test45()366*67e74705SXin Li void test45() { f45(x45); }
367*67e74705SXin Li 
368*67e74705SXin Li // Make sure we use byval to pass 64-bit vectors in memory; the LLVM call
369*67e74705SXin Li // lowering can't handle this case correctly because it runs after legalization.
370*67e74705SXin Li // CHECK: @test46
371*67e74705SXin Li // CHECK: call void @f46({{.*}}<2 x float>* byval align 8 {{.*}}, <2 x float>* byval align 8 {{.*}})
372*67e74705SXin Li typedef float v46 __attribute((vector_size(8)));
373*67e74705SXin Li void f46(v46,v46,v46,v46,v46,v46,v46,v46,v46,v46);
test46()374*67e74705SXin Li void test46() { v46 x = {1,2}; f46(x,x,x,x,x,x,x,x,x,x); }
375*67e74705SXin Li 
376*67e74705SXin Li // Check that we pass the struct below without using byval, which helps out
377*67e74705SXin Li // codegen.
378*67e74705SXin Li //
379*67e74705SXin Li // CHECK: @test47
380*67e74705SXin Li // CHECK: call void @f47(i32 {{.*}}, i32 {{.*}}, i32 {{.*}}, i32 {{.*}}, i32 {{.*}}, i32 {{.*}}, i32 {{.*}})
381*67e74705SXin Li struct s47 { unsigned a; };
382*67e74705SXin Li void f47(int,int,int,int,int,int,struct s47);
test47(int a,struct s47 b)383*67e74705SXin Li void test47(int a, struct s47 b) { f47(a, a, a, a, a, a, b); }
384*67e74705SXin Li 
385*67e74705SXin Li // rdar://12723368
386*67e74705SXin Li // In the following example, there are holes in T4 at the 3rd byte and the 4th
387*67e74705SXin Li // byte; however, T2 does not have those holes. T4 is chosen to be the
388*67e74705SXin Li // representing type for union T1, but we can't use load or store of T4 since
389*67e74705SXin Li // it will skip the 3rd byte and the 4th byte.
390*67e74705SXin Li // In general, since we don't accurately represent the data fields of a union,
391*67e74705SXin Li // do not use load or store of the representing llvm type for the union.
392*67e74705SXin Li typedef _Complex int T2;
393*67e74705SXin Li typedef _Complex char T5;
394*67e74705SXin Li typedef _Complex int T7;
395*67e74705SXin Li typedef struct T4 { T5 field0; T7 field1; } T4;
396*67e74705SXin Li typedef union T1 { T2 field0; T4 field1; } T1;
397*67e74705SXin Li extern T1 T1_retval;
test48(void)398*67e74705SXin Li T1 test48(void) {
399*67e74705SXin Li // CHECK: @test48
400*67e74705SXin Li // CHECK: memcpy
401*67e74705SXin Li // CHECK: memcpy
402*67e74705SXin Li   return T1_retval;
403*67e74705SXin Li }
404*67e74705SXin Li 
// test49_helper is variadic with a single fixed double parameter.
405*67e74705SXin Li void test49_helper(double, ...);
// Forwards both doubles to the helper, so `e` lands in the variadic part.
// The expectations following this function require two double loads and a
// direct call typed `void (double, ...)` with both values passed as double.
test49(double d,double e)406*67e74705SXin Li void test49(double d, double e) {
407*67e74705SXin Li   test49_helper(d, e);
408*67e74705SXin Li }
409*67e74705SXin Li // CHECK-LABEL:    define void @test49(
410*67e74705SXin Li // CHECK:      [[T0:%.*]] = load double, double*
411*67e74705SXin Li // CHECK-NEXT: [[T1:%.*]] = load double, double*
412*67e74705SXin Li // CHECK-NEXT: call void (double, ...) @test49_helper(double [[T0]], double [[T1]])
413*67e74705SXin Li 
// test50_helper is declared without a prototype (empty parameter list).
414*67e74705SXin Li void test50_helper();
// Calls the unprototyped helper with two doubles. The expectations following
// this function require the call to go through a bitcast of the `void (...)`
// declaration to `void (double, double, ...)`.
test50(double d,double e)415*67e74705SXin Li void test50(double d, double e) {
416*67e74705SXin Li   test50_helper(d, e);
417*67e74705SXin Li }
418*67e74705SXin Li // CHECK-LABEL:    define void @test50(
419*67e74705SXin Li // CHECK:      [[T0:%.*]] = load double, double*
420*67e74705SXin Li // CHECK-NEXT: [[T1:%.*]] = load double, double*
421*67e74705SXin Li // CHECK-NEXT: call void (double, double, ...) bitcast (void (...)* @test50_helper to void (double, double, ...)*)(double [[T0]], double [[T1]])
422*67e74705SXin Li 
// A struct whose only member is a 128-bit unsigned integer.
423*67e74705SXin Li struct test51_s { __uint128_t intval; };
// Fetches one `struct test51_s` from `argList` and stores it through `s`.
// The expectations following this function require a temporary alloca with
// alignment 16 and, after loading the pointer from field 3 of the va_list
// (named REG_SAVE_AREA in the patterns), a 16-byte memcpy into that
// temporary carrying an alignment of 8.
test51(struct test51_s * s,__builtin_va_list argList)424*67e74705SXin Li void test51(struct test51_s *s, __builtin_va_list argList) {
425*67e74705SXin Li     *s = __builtin_va_arg(argList, struct test51_s);
426*67e74705SXin Li }
427*67e74705SXin Li 
428*67e74705SXin Li // CHECK-LABEL: define void @test51
429*67e74705SXin Li // CHECK: [[TMP_ADDR:%.*]] = alloca [[STRUCT_TEST51:%.*]], align 16
430*67e74705SXin Li // CHECK: br i1
431*67e74705SXin Li // CHECK: [[REG_SAVE_AREA_PTR:%.*]] = getelementptr inbounds {{.*}}, i32 0, i32 3
432*67e74705SXin Li // CHECK-NEXT: [[REG_SAVE_AREA:%.*]] = load i8*, i8** [[REG_SAVE_AREA_PTR]]
433*67e74705SXin Li // CHECK-NEXT: [[VALUE_ADDR:%.*]] = getelementptr i8, i8* [[REG_SAVE_AREA]], i32 {{.*}}
434*67e74705SXin Li // CHECK-NEXT: [[CASTED_VALUE_ADDR:%.*]] = bitcast i8* [[VALUE_ADDR]] to [[STRUCT_TEST51]]
435*67e74705SXin Li // CHECK-NEXT: [[CASTED_TMP_ADDR:%.*]] = bitcast [[STRUCT_TEST51]]* [[TMP_ADDR]] to i8*
436*67e74705SXin Li // CHECK-NEXT: [[RECASTED_VALUE_ADDR:%.*]] = bitcast [[STRUCT_TEST51]]* [[CASTED_VALUE_ADDR]] to i8*
437*67e74705SXin Li // CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* [[CASTED_TMP_ADDR]], i8* [[RECASTED_VALUE_ADDR]], i64 16, i32 8, i1 false)
438*67e74705SXin Li // CHECK-NEXT: add i32 {{.*}}, 16
439*67e74705SXin Li // CHECK-NEXT: store i32 {{.*}}, i32* {{.*}}
440*67e74705SXin Li // CHECK-NEXT: br label
441*67e74705SXin Li 
// Variadic helper with one fixed int parameter, plus a 32-byte float vector
// object to pass to it.
442*67e74705SXin Li void test52_helper(int, ...);
443*67e74705SXin Li __m256 x52;
// Passes the vector, six double constants and the imaginary literal 1.0i as
// variadic arguments. The AVX expectation after this function requires the
// vector to appear as a direct <8 x float> argument and the trailing complex
// value to appear as two separate double arguments.
test52()444*67e74705SXin Li void test52() {
445*67e74705SXin Li   test52_helper(0, x52, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0i);
446*67e74705SXin Li }
447*67e74705SXin Li // AVX: @test52_helper(i32 0, <8 x float> {{%[a-zA-Z0-9]+}}, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double {{%[a-zA-Z0-9]+}}, double {{%[a-zA-Z0-9]+}})
448*67e74705SXin Li 
// Fetches one __m256 from `argList` and stores it through `m`. The AVX
// expectations after this function require that no conditional branch
// (`br i1`) occurs before `ret void`; presumably this means the register
// save area is never consulted for this type -- TODO confirm.
test53(__m256 * m,__builtin_va_list argList)449*67e74705SXin Li void test53(__m256 *m, __builtin_va_list argList) {
450*67e74705SXin Li   *m = __builtin_va_arg(argList, __m256);
451*67e74705SXin Li }
452*67e74705SXin Li // AVX-LABEL: define void @test53
453*67e74705SXin Li // AVX-NOT: br i1
454*67e74705SXin Li // AVX: ret void
455*67e74705SXin Li 
// Variadic helper whose single fixed parameter is a 32-byte float vector.
456*67e74705SXin Li void test54_helper(__m256, ...);
457*67e74705SXin Li __m256 x54;
// Makes two calls that differ only in how many double constants (five, then
// six) precede the trailing 1.0i. Per the AVX expectations after this
// function, the first call passes the complex value as two double arguments,
// while the second passes it as `{ double, double }* byval align 8`.
// Presumably the extra double leaves too few SSE registers for both halves
// of the complex value -- TODO confirm.
test54()458*67e74705SXin Li void test54() {
459*67e74705SXin Li   test54_helper(x54, x54, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0i);
460*67e74705SXin Li   test54_helper(x54, x54, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0i);
461*67e74705SXin Li }
462*67e74705SXin Li // AVX: @test54_helper(<8 x float> {{%[a-zA-Z0-9]+}}, <8 x float> {{%[a-zA-Z0-9]+}}, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double {{%[a-zA-Z0-9]+}}, double {{%[a-zA-Z0-9]+}})
463*67e74705SXin Li // AVX: @test54_helper(<8 x float> {{%[a-zA-Z0-9]+}}, <8 x float> {{%[a-zA-Z0-9]+}}, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, { double, double }* byval align 8 {{%[a-zA-Z0-9]+}})
464*67e74705SXin Li 
465*67e74705SXin Li typedef float __m512 __attribute__ ((__vector_size__ (64)));
466*67e74705SXin Li typedef struct {
467*67e74705SXin Li   __m512 m;
468*67e74705SXin Li } s512;
469*67e74705SXin Li 
470*67e74705SXin Li s512 x55;
471*67e74705SXin Li __m512 x56;
472*67e74705SXin Li 
473*67e74705SXin Li // Even on AVX512, aggregates of size larger than four eightbytes have class
474*67e74705SXin Li // MEMORY (AVX512 draft 0.3 3.2.3p2 Rule 1).
475*67e74705SXin Li //
476*67e74705SXin Li // CHECK: declare void @f55(%struct.s512* byval align 64)
477*67e74705SXin Li void f55(s512 x);
478*67e74705SXin Li 
479*67e74705SXin Li // However, __m512 has type SSE/SSEUP on AVX512.
480*67e74705SXin Li //
481*67e74705SXin Li // AVX512: declare void @f56(<16 x float>)
482*67e74705SXin Li // NO-AVX512: declare void @f56(<16 x float>* byval align 64)
483*67e74705SXin Li void f56(__m512 x);
// Calls f55 and then f56 with the file-scope objects x55 and x56. Both
// callees are declared but not defined in this file; presumably these calls
// are what make their declarations appear in the emitted IR -- TODO confirm.
f57()484*67e74705SXin Li void f57() { f55(x55); f56(x56); }
485*67e74705SXin Li 
486*67e74705SXin Li // Like for __m128 on AVX, check that the struct below is passed
487*67e74705SXin Li // in the same way regardless of AVX512 being used.
488*67e74705SXin Li //
489*67e74705SXin Li // CHECK: declare void @f58(%struct.t256* byval align 32)
490*67e74705SXin Li typedef struct t256 {
491*67e74705SXin Li   __m256 m;
492*67e74705SXin Li   __m256 n;
493*67e74705SXin Li } two256;
494*67e74705SXin Li 
495*67e74705SXin Li extern void f58(two256 s);
f59(two256 s)496*67e74705SXin Li void f59(two256 s) {
497*67e74705SXin Li   f58(s);
498*67e74705SXin Li }
499*67e74705SXin Li 
500*67e74705SXin Li // CHECK: declare void @f60(%struct.sat256* byval align 32)
501*67e74705SXin Li typedef struct at256 {
502*67e74705SXin Li   __m256 array[2];
503*67e74705SXin Li } Atwo256;
504*67e74705SXin Li typedef struct sat256 {
505*67e74705SXin Li   Atwo256 x;
506*67e74705SXin Li } SAtwo256;
507*67e74705SXin Li 
508*67e74705SXin Li extern void f60(SAtwo256 s);
f61(SAtwo256 s)509*67e74705SXin Li void f61(SAtwo256 s) {
510*67e74705SXin Li   f60(s);
511*67e74705SXin Li }
512*67e74705SXin Li 
513*67e74705SXin Li // AVX512: @f62_helper(i32 0, <16 x float> {{%[a-zA-Z0-9]+}}, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double {{%[a-zA-Z0-9]+}}, double {{%[a-zA-Z0-9]+}})
// Variadic helper with one fixed int parameter, plus a 64-byte float vector
// object to pass to it.
514*67e74705SXin Li void f62_helper(int, ...);
515*67e74705SXin Li __m512 x62;
// Passes the 64-byte vector, six double constants and the imaginary literal
// 1.0i as variadic arguments. The AVX512 expectation preceding the helper
// declaration requires the vector to appear as a direct <16 x float> argument
// and the trailing complex value as two separate double arguments.
f62()516*67e74705SXin Li void f62() {
517*67e74705SXin Li   f62_helper(0, x62, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0i);
518*67e74705SXin Li }
519*67e74705SXin Li 
520*67e74705SXin Li // Like for __m256 on AVX, we always pass __m512 in memory, and don't
521*67e74705SXin Li // need to use the register save area.
522*67e74705SXin Li //
523*67e74705SXin Li // AVX512-LABEL: define void @f63
524*67e74705SXin Li // AVX512-NOT: br i1
525*67e74705SXin Li // AVX512: ret void
f63(__m512 * m,__builtin_va_list argList)526*67e74705SXin Li void f63(__m512 *m, __builtin_va_list argList) {
527*67e74705SXin Li   *m = __builtin_va_arg(argList, __m512);
528*67e74705SXin Li }
529*67e74705SXin Li 
530*67e74705SXin Li // AVX512: @f64_helper(<16 x float> {{%[a-zA-Z0-9]+}}, <16 x float> {{%[a-zA-Z0-9]+}}, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double {{%[a-zA-Z0-9]+}}, double {{%[a-zA-Z0-9]+}})
531*67e74705SXin Li // AVX512: @f64_helper(<16 x float> {{%[a-zA-Z0-9]+}}, <16 x float> {{%[a-zA-Z0-9]+}}, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, { double, double }* byval align 8 {{%[a-zA-Z0-9]+}})
// Variadic helper whose single fixed parameter is a 64-byte float vector.
532*67e74705SXin Li void f64_helper(__m512, ...);
533*67e74705SXin Li __m512 x64;
// Makes two calls that differ only in how many double constants (five, then
// six) precede the trailing 1.0i. Per the AVX512 expectations preceding the
// helper declaration, the first call passes the complex value as two double
// arguments, while the second passes it as
// `{ double, double }* byval align 8`.
f64()534*67e74705SXin Li void f64() {
535*67e74705SXin Li   f64_helper(x64, x64, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0i);
536*67e74705SXin Li   f64_helper(x64, x64, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0i);
537*67e74705SXin Li }
538