; RUN: llc -march=hexagon -mcpu=hexagonv5 -enable-pipeliner < %s | FileCheck %s
; RUN: llc -march=hexagon -mcpu=hexagonv5 -O2 < %s | FileCheck %s
; RUN: llc -march=hexagon -mcpu=hexagonv5 -O3 < %s | FileCheck %s
;
; Check that we pipeline a vectorized dot product in a single packet.
;
; The same output patterns are applied to all three llc invocations above
; (explicit -enable-pipeliner, -O2 and -O3). In order, they expect an opening
; brace, two "+= mpyi" multiply-accumulates, two "memd" accesses, and a
; closing brace tagged ":endloop0".
;
; NOTE(review): the patterns below allow arbitrary intervening output between
; matches, so on their own they do not prove that all four instructions sit in
; one packet. Consider tightening them if that guarantee matters.
;
; CHECK: {
; CHECK: += mpyi
; CHECK: += mpyi
; CHECK: memd
; CHECK: memd
; CHECK: } :endloop0

; Input arrays for the dot product: 5000 x i32 each, 8-byte aligned so that a
; <2 x i32> load at any even element index satisfies the "align 8" on the loads.
@a = common global [5000 x i32] zeroinitializer, align 8
@b = common global [5000 x i32] zeroinitializer, align 8

; Computes the dot product of @a and @b two elements at a time and returns the
; sum of the two vector lanes of the accumulator.
define i32 @vecMultGlobal() {
entry:
  br label %polly.loop_body

; Loop exit: horizontally add the two lanes of the final accumulator.
polly.loop_after:
  %0 = extractelement <2 x i32> %addp_vec, i32 0
  %1 = extractelement <2 x i32> %addp_vec, i32 1
  %add_sum = add i32 %0, %1
  ret i32 %add_sum

; Loop body: one iteration handles elements [iv, iv+1] of both arrays.
polly.loop_body:
  ; Induction variable: starts at 0 and advances by 2 per iteration.
  %polly.loopiv13 = phi i32 [ 0, %entry ], [ %polly.next_loopiv, %polly.loop_body ]
  ; Running <2 x i32> accumulator, zero on entry.
  %reduction.012 = phi <2 x i32> [ zeroinitializer, %entry ], [ %addp_vec, %polly.loop_body ]
  %polly.next_loopiv = add nsw i32 %polly.loopiv13, 2
  %p_arrayidx1 = getelementptr [5000 x i32], [5000 x i32]* @b, i32 0, i32 %polly.loopiv13
  %p_arrayidx = getelementptr [5000 x i32], [5000 x i32]* @a, i32 0, i32 %polly.loopiv13
  ; Reinterpret the element pointers as <2 x i32>* so each load fetches a pair.
  %vector_ptr = bitcast i32* %p_arrayidx1 to <2 x i32>*
  %_p_vec_full = load <2 x i32>, <2 x i32>* %vector_ptr, align 8
  %vector_ptr7 = bitcast i32* %p_arrayidx to <2 x i32>*
  %_p_vec_full8 = load <2 x i32>, <2 x i32>* %vector_ptr7, align 8
  ; Lane-wise multiply, then accumulate into the reduction vector.
  %mulp_vec = mul <2 x i32> %_p_vec_full8, %_p_vec_full
  %addp_vec = add <2 x i32> %mulp_vec, %reduction.012
  ; Continue while the next index is still below the array length.
  %2 = icmp slt i32 %polly.next_loopiv, 5000
  br i1 %2, label %polly.loop_body, label %polly.loop_after
}