; RUN: llc -O3 -mcpu=pwr8 -mtriple=powerpc64le-unknown-linux-gnu < %s | FileCheck -implicit-check-not=xxpermdi -implicit-check-not=xxswapd %s
; RUN: llc -O3 -mcpu=pwr8 -disable-ppc-vsx-swap-removal -mtriple=powerpc64le-unknown-linux-gnu < %s | FileCheck -check-prefix=NOOPTSWAP %s

; Purpose: for a little-endian pwr8 target, verify that the vector loads and
; stores of the loop below are emitted as lxvd2x / stxvd2x with no accompanying
; xxswapd / xxpermdi when VSX swap removal is enabled (first invocation), and
; that the swaps are present when the pass is turned off with
; -disable-ppc-vsx-swap-removal (second invocation, NOOPTSWAP prefix).
;
; The first invocation passes -implicit-check-not for both swap mnemonics so
; that their absence is enforced over the whole output, not only in the region
; that precedes the first positive match.

; This test was generated from the following source:
;
; #define N 4096
; int ca[N] __attribute__((aligned(16)));
; int cb[N] __attribute__((aligned(16)));
; int cc[N] __attribute__((aligned(16)));
; int cd[N] __attribute__((aligned(16)));
;
; void foo ()
; {
;   int i;
;   for (i = 0; i < N; i++) {
;     ca[i] = (cb[i] + cc[i]) * cd[i];
;   }
; }

@cb = common global [4096 x i32] zeroinitializer, align 16
@cc = common global [4096 x i32] zeroinitializer, align 16
@cd = common global [4096 x i32] zeroinitializer, align 16
@ca = common global [4096 x i32] zeroinitializer, align 16

; The loop body holds four copies of the same <4 x i32> computation
; (ca = (cb + cc) * cd). Each copy advances the index by 4, so one trip through
; vector.body covers 16 elements; the loop exits when the index reaches 4096.
define void @foo() {
entry:
  br label %vector.body

vector.body:
  %index = phi i64 [ 0, %entry ], [ %index.next.3, %vector.body ]
  ; Copy 0: elements [index, index+3].
  %0 = getelementptr inbounds [4096 x i32], [4096 x i32]* @cb, i64 0, i64 %index
  %1 = bitcast i32* %0 to <4 x i32>*
  %wide.load = load <4 x i32>, <4 x i32>* %1, align 16
  %2 = getelementptr inbounds [4096 x i32], [4096 x i32]* @cc, i64 0, i64 %index
  %3 = bitcast i32* %2 to <4 x i32>*
  %wide.load13 = load <4 x i32>, <4 x i32>* %3, align 16
  %4 = add nsw <4 x i32> %wide.load13, %wide.load
  %5 = getelementptr inbounds [4096 x i32], [4096 x i32]* @cd, i64 0, i64 %index
  %6 = bitcast i32* %5 to <4 x i32>*
  %wide.load14 = load <4 x i32>, <4 x i32>* %6, align 16
  %7 = mul nsw <4 x i32> %4, %wide.load14
  %8 = getelementptr inbounds [4096 x i32], [4096 x i32]* @ca, i64 0, i64 %index
  %9 = bitcast i32* %8 to <4 x i32>*
  store <4 x i32> %7, <4 x i32>* %9, align 16
  ; Copy 1: elements [index+4, index+7].
  %index.next = add nuw nsw i64 %index, 4
  %10 = getelementptr inbounds [4096 x i32], [4096 x i32]* @cb, i64 0, i64 %index.next
  %11 = bitcast i32* %10 to <4 x i32>*
  %wide.load.1 = load <4 x i32>, <4 x i32>* %11, align 16
  %12 = getelementptr inbounds [4096 x i32], [4096 x i32]* @cc, i64 0, i64 %index.next
  %13 = bitcast i32* %12 to <4 x i32>*
  %wide.load13.1 = load <4 x i32>, <4 x i32>* %13, align 16
  %14 = add nsw <4 x i32> %wide.load13.1, %wide.load.1
  %15 = getelementptr inbounds [4096 x i32], [4096 x i32]* @cd, i64 0, i64 %index.next
  %16 = bitcast i32* %15 to <4 x i32>*
  %wide.load14.1 = load <4 x i32>, <4 x i32>* %16, align 16
  %17 = mul nsw <4 x i32> %14, %wide.load14.1
  %18 = getelementptr inbounds [4096 x i32], [4096 x i32]* @ca, i64 0, i64 %index.next
  %19 = bitcast i32* %18 to <4 x i32>*
  store <4 x i32> %17, <4 x i32>* %19, align 16
  ; Copy 2: elements [index+8, index+11].
  %index.next.1 = add nuw nsw i64 %index.next, 4
  %20 = getelementptr inbounds [4096 x i32], [4096 x i32]* @cb, i64 0, i64 %index.next.1
  %21 = bitcast i32* %20 to <4 x i32>*
  %wide.load.2 = load <4 x i32>, <4 x i32>* %21, align 16
  %22 = getelementptr inbounds [4096 x i32], [4096 x i32]* @cc, i64 0, i64 %index.next.1
  %23 = bitcast i32* %22 to <4 x i32>*
  %wide.load13.2 = load <4 x i32>, <4 x i32>* %23, align 16
  %24 = add nsw <4 x i32> %wide.load13.2, %wide.load.2
  %25 = getelementptr inbounds [4096 x i32], [4096 x i32]* @cd, i64 0, i64 %index.next.1
  %26 = bitcast i32* %25 to <4 x i32>*
  %wide.load14.2 = load <4 x i32>, <4 x i32>* %26, align 16
  %27 = mul nsw <4 x i32> %24, %wide.load14.2
  %28 = getelementptr inbounds [4096 x i32], [4096 x i32]* @ca, i64 0, i64 %index.next.1
  %29 = bitcast i32* %28 to <4 x i32>*
  store <4 x i32> %27, <4 x i32>* %29, align 16
  ; Copy 3: elements [index+12, index+15].
  %index.next.2 = add nuw nsw i64 %index.next.1, 4
  %30 = getelementptr inbounds [4096 x i32], [4096 x i32]* @cb, i64 0, i64 %index.next.2
  %31 = bitcast i32* %30 to <4 x i32>*
  %wide.load.3 = load <4 x i32>, <4 x i32>* %31, align 16
  %32 = getelementptr inbounds [4096 x i32], [4096 x i32]* @cc, i64 0, i64 %index.next.2
  %33 = bitcast i32* %32 to <4 x i32>*
  %wide.load13.3 = load <4 x i32>, <4 x i32>* %33, align 16
  %34 = add nsw <4 x i32> %wide.load13.3, %wide.load.3
  %35 = getelementptr inbounds [4096 x i32], [4096 x i32]* @cd, i64 0, i64 %index.next.2
  %36 = bitcast i32* %35 to <4 x i32>*
  %wide.load14.3 = load <4 x i32>, <4 x i32>* %36, align 16
  %37 = mul nsw <4 x i32> %34, %wide.load14.3
  %38 = getelementptr inbounds [4096 x i32], [4096 x i32]* @ca, i64 0, i64 %index.next.2
  %39 = bitcast i32* %38 to <4 x i32>*
  store <4 x i32> %37, <4 x i32>* %39, align 16
  ; Back edge: continue until all 4096 elements have been processed.
  %index.next.3 = add nuw nsw i64 %index.next.2, 4
  %40 = icmp eq i64 %index.next.3, 4096
  br i1 %40, label %for.end, label %vector.body

for.end:
  ret void
}

; Swap removal enabled: four load/load/load/add/mul/store groups, one per
; copy of the loop body. The two negative checks right after the label only
; cover the text up to the first lxvd2x match; the -implicit-check-not options
; on the first invocation extend the same requirement to the rest of the output.

; CHECK-LABEL: @foo
; CHECK-NOT: xxpermdi
; CHECK-NOT: xxswapd

; CHECK: lxvd2x
; CHECK: lxvd2x
; CHECK-DAG: lxvd2x
; CHECK-DAG: vadduwm
; CHECK: vmuluwm
; CHECK: stxvd2x

; CHECK: lxvd2x
; CHECK: lxvd2x
; CHECK-DAG: lxvd2x
; CHECK-DAG: vadduwm
; CHECK: vmuluwm
; CHECK: stxvd2x

; CHECK: lxvd2x
; CHECK: lxvd2x
; CHECK-DAG: lxvd2x
; CHECK-DAG: vadduwm
; CHECK: vmuluwm
; CHECK: stxvd2x

; CHECK: lxvd2x
; CHECK: lxvd2x
; CHECK-DAG: lxvd2x
; CHECK-DAG: vadduwm
; CHECK: vmuluwm
; CHECK: stxvd2x


; Swap removal disabled: the loads, the add/multiply and the stores are
; expected together with xxswapd instructions.

; NOOPTSWAP-LABEL: @foo

; NOOPTSWAP: lxvd2x
; NOOPTSWAP-DAG: lxvd2x
; NOOPTSWAP-DAG: lxvd2x
; NOOPTSWAP-DAG: xxswapd
; NOOPTSWAP-DAG: xxswapd
; NOOPTSWAP-DAG: xxswapd
; NOOPTSWAP-DAG: vadduwm
; NOOPTSWAP: vmuluwm
; NOOPTSWAP: xxswapd
; NOOPTSWAP-DAG: xxswapd
; NOOPTSWAP-DAG: xxswapd
; NOOPTSWAP-DAG: stxvd2x
; NOOPTSWAP-DAG: stxvd2x
; NOOPTSWAP: stxvd2x
