// xref: /aosp_15_r20/external/clang/test/OpenMP/taskloop_simd_codegen.cpp (revision 67e74705e28f6214e480b399dd47ea732279e315)
// RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck %s
// RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck %s
// expected-no-diagnostics
// REQUIRES: x86-registered-target
#ifndef HEADER
#define HEADER
// Test driver: three `taskloop simd` loops. The FileCheck directives placed
// ahead of each pragma pin the IR emitted for that loop inside main: a task
// allocation through __kmpc_omp_task_alloc, stores of the lower bound, upper
// bound and stride into the task data (fields 5, 6 and 7), and the final
// __kmpc_taskloop call. The outlined task bodies ([[TASK1]]..[[TASK3]]) are
// matched by directives that follow this function.
// CHECK-LABEL: @main
int main(int argc, char **argv) {
// Loop 1 -- priority(argc). The allocation is matched with a flags argument of
// 33, the bounds are the constants 0 and 9, and the taskloop call ends with
// `i32 0, i32 0, i64 0`.
// CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%ident_t* [[DEFLOC:@.+]])
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%ident_t* [[DEFLOC]], i32 [[GTID]], i32 33, i64 72, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK1:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 9, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: call void @__kmpc_taskloop(%ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 0, i32 0, i64 0, i8* null)
#pragma omp taskloop simd priority(argc)
  for (int i = 0; i < 10; ++i)
    ;
// Loop 2 -- nogroup grainsize(argc) simdlen(4). A value zero-extended to i64
// ([[GRAINSIZE]]) is matched as the last integer argument of the taskloop
// call, preceded by `i32 1, i32 1`.
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 72, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK2:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 9, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[GRAINSIZE:%.+]] = zext i32 %{{.+}} to i64
// CHECK: call void @__kmpc_taskloop(%ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 1, i64 [[GRAINSIZE]], i8* null)
#pragma omp taskloop simd nogroup grainsize(argc) simdlen(4)
  for (int i = 0; i < 10; ++i)
    ;
// Loop 3 -- if(argc) shared(argc, argv) collapse(2) num_tasks(4) safelen(32).
// The `icmp ne ... 0` result, sign-extended to i32 ([[IF_INT]]), is matched as
// the fourth argument of the taskloop call; the upper bound is a computed
// value rather than a constant, and the call ends with `i32 0, i32 2, i64 4`.
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 72, i64 24, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK3:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[IF:%.+]] = icmp ne i32 %{{.+}}, 0
// CHECK: [[IF_INT:%.+]] = sext i1 [[IF]] to i32
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 %{{.+}}, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: call void @__kmpc_taskloop(%ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 [[IF_INT]], i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 0, i32 2, i64 4, i8* null)
  int i;
#pragma omp taskloop simd if(argc) shared(argc, argv) collapse(2) num_tasks(4) safelen(32)
  for (i = 0; i < argc; ++i)
  for (int j = argc; j < argv[argc][argc]; ++j)
    ;
}
// CHECK: define internal i32 [[TASK1]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
// CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
// CHECK: br label
// CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],{{.*}}!llvm.mem.parallel_loop_access [[LOOP1:!.+]]
// CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
// CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],{{.*}}!llvm.mem.parallel_loop_access [[LOOP1]]
// CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
// CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
// CHECK: load i32, i32* %{{.*}}!llvm.mem.parallel_loop_access [[LOOP1]]
// CHECK: store i32 %{{.*}}!llvm.mem.parallel_loop_access [[LOOP1]]
// CHECK: load i32, i32* %{{.*}}!llvm.mem.parallel_loop_access [[LOOP1]]
// CHECK: add nsw i32 %{{.+}}, 1
// CHECK: store i32 %{{.+}}, i32* %{{.*}}!llvm.mem.parallel_loop_access [[LOOP1]]
// CHECK: br label %{{.*}}!llvm.loop [[LOOP1]]
// CHECK: ret i32 0

// CHECK: define internal i32 [[TASK2]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
// CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
// CHECK: br label
// CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],{{.*}}!llvm.mem.parallel_loop_access [[LOOP2:!.+]]
// CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
// CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],{{.*}}!llvm.mem.parallel_loop_access [[LOOP2]]
// CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
// CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
// CHECK: load i32, i32* %{{.*}}!llvm.mem.parallel_loop_access [[LOOP2]]
// CHECK: store i32 %{{.*}}!llvm.mem.parallel_loop_access [[LOOP2]]
// CHECK: load i32, i32* %{{.*}}!llvm.mem.parallel_loop_access [[LOOP2]]
// CHECK: add nsw i32 %{{.+}}, 1
// CHECK: store i32 %{{.+}}, i32* %{{.*}}!llvm.mem.parallel_loop_access [[LOOP2]]
// CHECK: br label %{{.*}}!llvm.loop [[LOOP2]]
// CHECK: ret i32 0

// CHECK: define internal i32 [[TASK3]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: store i64 [[LB_VAL]], i64* [[CNT:%.+]],
// CHECK: br label
// CHECK-NOT: !llvm.mem.parallel_loop_access
// CHECK: br label %{{.*}}!llvm.loop
// CHECK: ret i32 0
// Covers a `taskloop simd` inside a constructor whose loop variable is the
// data member `a`. The global object `s(1)` instantiates the constructor. The
// directives inside pin the constructor's IR: a task allocation with size
// arguments 72 and 16, bounds/stride stores into the task data, and a
// __kmpc_taskloop call ending with `i32 0, i32 2, i64 [[NUM_TASKS]]`, where
// [[NUM_TASKS]] is a zero-extended i32 value. The outlined body ([[TASK4]]) is
// matched by directives that follow this struct.
// CHECK-LABEL: @_ZN1SC2Ei
struct S {
  int a;
  S(int c) {
// CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%ident_t* [[DEFLOC:@.+]])
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 72, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK4:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 %{{.+}}, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[NUM_TASKS:%.+]] = zext i32 %{{.+}} to i64
// CHECK: call void @__kmpc_taskloop(%ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 0, i32 2, i64 [[NUM_TASKS]], i8* null)
#pragma omp taskloop simd shared(c) num_tasks(a) simdlen(64) safelen(8)
    for (a = 0; a < c; ++a)
      ;
  }
} s(1);
// CHECK: define internal i32 [[TASK4]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
// CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
// CHECK: br label
// CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
// CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
// CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
// CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
// CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
// CHECK: load i32, i32* %
// CHECK-NOT: !llvm.mem.parallel_loop_access
// CHECK: store i32 %
// CHECK-NOT: !llvm.mem.parallel_loop_access
// CHECK: load i32, i32* %
// CHECK-NOT: !llvm.mem.parallel_loop_access
// CHECK: add nsw i32 %{{.+}}, 1
// CHECK: store i32 %{{.+}}, i32* %
// CHECK-NOT: !llvm.mem.parallel_loop_access
// CHECK: br label %{{.*}}!llvm.loop
// CHECK: ret i32 0

// CHECK: !{!"llvm.loop.vectorize.enable", i1 true}
// CHECK: !{!"llvm.loop.vectorize.width", i32 4}
// CHECK: !{!"llvm.loop.vectorize.width", i32 32}
// CHECK: !{!"llvm.loop.vectorize.width", i32 64}

#endif