; RUN: llc -O3 -march=hexagon -mcpu=hexagonv5 < %s | FileCheck %s
;
; Generate hardware loop when unknown trip count loop is vectorized.
;
; The function below contains two loops: a 2-wide vector loop and a scalar
; remainder loop. Both are expected to be emitted as hardware loops, so the
; loop0/endloop0 pair is matched twice.

; CHECK: loop0(.LBB{{[0-9]*}}_{{[0-9]*}}, r{{[0-9]+}})
; CHECK: endloop0
; CHECK: loop0(.LBB{{[0-9]*}}_{{[0-9]*}}, r{{[0-9]+}})
; CHECK: endloop0

; Input arrays read by @dotprod2.
@A = common global [1000 x i32] zeroinitializer, align 8
@B = common global [1000 x i32] zeroinitializer, align 8

; Sums A[i] * B[i] over the first %count elements and returns the total.
; Returns 0 when %count <= 0.
;
; NOTE: the textual order of the basic blocks must be kept as is; the unnamed
; values %0..%5 are numbered by their order of appearance in the function.
define i32 @dotprod2(i32 %count) #0 {
entry.split:
  ; Nothing to do for a non-positive element count.
  %cmp6 = icmp sgt i32 %count, 0
  br i1 %cmp6, label %polly.cond, label %for.end

for.end.loopexit:
  br label %for.end

for.end:
  ; Final result: 0 (no work), the vector-only partial sum, or the sum after
  ; the scalar remainder loop.
  %sum.0.lcssa.reg2mem.0.load37 = phi i32 [ 0, %entry.split ], [ %p_add34, %polly.loop_if13 ], [ %p_add, %for.end.loopexit ]
  ret i32 %sum.0.lcssa.reg2mem.0.load37

polly.cond:
  ; The vector path is only entered when there are at least two elements.
  %0 = icmp sgt i32 %count, 1
  br i1 %0, label %polly.loop_if, label %polly.loop_if13

polly.loop_exit.loopexit:
  br label %polly.loop_exit

polly.loop_exit:
  ; Horizontal reduction: add the two lanes of the vector accumulator.
  %1 = phi <2 x i32> [ zeroinitializer, %polly.loop_if ], [ %addp_vec, %polly.loop_exit.loopexit ]
  %2 = extractelement <2 x i32> %1, i32 0
  %3 = extractelement <2 x i32> %1, i32 1
  %add_sum = add i32 %2, %3
  br label %polly.loop_if13

polly.loop_if:
  ; %leftover_lb = (%count - 1) with the low bit cleared; it is the first index
  ; handed to the scalar remainder loop. The vector loop is skipped when it is 0.
  %4 = add i32 %count, -1
  %leftover_lb = and i32 %4, -2
  %polly.loop_guard = icmp eq i32 %leftover_lb, 0
  br i1 %polly.loop_guard, label %polly.loop_exit, label %polly.loop_preheader

polly.stmt.for.body:
  ; Vector loop: two i32 elements of @A and @B per iteration, induction
  ; variable and both pointers advance by 2.
  %addp_vec28 = phi <2 x i32> [ zeroinitializer, %polly.loop_preheader ], [ %addp_vec, %polly.stmt.for.body ]
  %scevgep.phi = phi i32* [ getelementptr inbounds ([1000 x i32], [1000 x i32]* @A, i32 0, i32 0), %polly.loop_preheader ], [ %scevgep.inc, %polly.stmt.for.body ]
  %scevgep9.phi = phi i32* [ getelementptr inbounds ([1000 x i32], [1000 x i32]* @B, i32 0, i32 0), %polly.loop_preheader ], [ %scevgep9.inc, %polly.stmt.for.body ]
  %polly.indvar = phi i32 [ 0, %polly.loop_preheader ], [ %polly.indvar_next, %polly.stmt.for.body ]
  %vector_ptr = bitcast i32* %scevgep.phi to <2 x i32>*
  %_p_vec_full = load <2 x i32>, <2 x i32>* %vector_ptr, align 8
  %vector_ptr10 = bitcast i32* %scevgep9.phi to <2 x i32>*
  %_p_vec_full11 = load <2 x i32>, <2 x i32>* %vector_ptr10, align 8
  %mulp_vec = mul <2 x i32> %_p_vec_full11, %_p_vec_full
  %addp_vec = add <2 x i32> %mulp_vec, %addp_vec28
  %polly.indvar_next = add nsw i32 %polly.indvar, 2
  ; Exit test compares the pre-increment induction variable with the adjusted
  ; upper bound (%leftover_lb - 2).
  %polly.loop_cond = icmp eq i32 %polly.indvar, %polly.adjust_ub
  %scevgep.inc = getelementptr i32, i32* %scevgep.phi, i32 2
  %scevgep9.inc = getelementptr i32, i32* %scevgep9.phi, i32 2
  br i1 %polly.loop_cond, label %polly.loop_exit.loopexit, label %polly.stmt.for.body

polly.loop_preheader:
  %polly.adjust_ub = add i32 %leftover_lb, -2
  br label %polly.stmt.for.body

polly.loop_if13:
  ; Merge point before the scalar remainder loop: running sum and the first
  ; index that still has to be processed.
  %p_add34 = phi i32 [ 0, %polly.cond ], [ %add_sum, %polly.loop_exit ]
  %merge.lb = phi i32 [ 0, %polly.cond ], [ %leftover_lb, %polly.loop_exit ]
  %polly.loop_guard17 = icmp slt i32 %merge.lb, %count
  br i1 %polly.loop_guard17, label %polly.loop_preheader15, label %for.end

polly.stmt.for.body22:
  ; Scalar remainder loop: one element per iteration, from %merge.lb up to and
  ; including %count - 1.
  %p_add30 = phi i32 [ %p_add34, %polly.loop_preheader15 ], [ %p_add, %polly.stmt.for.body22 ]
  %polly.indvar18 = phi i32 [ %merge.lb, %polly.loop_preheader15 ], [ %polly.indvar_next19, %polly.stmt.for.body22 ]
  ; Annotation call carrying the !polly.loop.smallTripCount metadata; its
  ; result (%5) is unused.
  %5 = tail call i32 @llvm.annotation.i32(i32 %polly.indvar18, i8* null, i8* null, i32 0), !polly.loop.smallTripCount !0
  %scevgep23 = getelementptr [1000 x i32], [1000 x i32]* @A, i32 0, i32 %polly.indvar18
  %_p_scalar_ = load i32, i32* %scevgep23, align 4
  %scevgep24 = getelementptr [1000 x i32], [1000 x i32]* @B, i32 0, i32 %polly.indvar18
  %_p_scalar_25 = load i32, i32* %scevgep24, align 4
  %p_mul = mul nsw i32 %_p_scalar_25, %_p_scalar_
  %p_add = add nsw i32 %p_mul, %p_add30
  %polly.indvar_next19 = add nsw i32 %polly.indvar18, 1
  %polly.loop_cond21 = icmp slt i32 %polly.indvar18, %polly.adjust_ub20
  br i1 %polly.loop_cond21, label %polly.stmt.for.body22, label %for.end.loopexit

polly.loop_preheader15:
  %polly.adjust_ub20 = add i32 %count, -1
  br label %polly.stmt.for.body22
}

declare i32 @llvm.annotation.i32(i32, i8*, i8*, i32) #1

; Empty metadata node attached to the annotation call in the scalar loop.
!0 = !{}