; RUN: llc < %s -march=arm64 -aarch64-neon-syntax=apple | FileCheck %s

; Codegen test for interleaving vector shuffles on AArch64.
;
; Every function below follows the same shape:
;   1. load two vectors of the same type from %A and %B,
;   2. build the interleave of their low halves  (mask 0, N, 1, N+1, ...),
;   3. build the interleave of their high halves (mask N/2, N+N/2, ...),
;   4. combine both results with add/fadd so neither shuffle is dead.
; The expectations require one zip1 and one zip2, with the arithmetic
; instruction on the line immediately after the zip2. The llc invocation above
; requests Apple-style NEON syntax, which is why the expected mnemonics carry
; the arrangement as a suffix (for example "zip1.8b").

; 64-bit vector, eight i8 lanes.
define <8 x i8> @vzipi8(<8 x i8>* %A, <8 x i8>* %B) nounwind {
;CHECK-LABEL: vzipi8:
;CHECK: zip1.8b
;CHECK: zip2.8b
;CHECK-NEXT: add.8b
  %tmp1 = load <8 x i8>, <8 x i8>* %A
  %tmp2 = load <8 x i8>, <8 x i8>* %B
  %tmp3 = shufflevector <8 x i8> %tmp1, <8 x i8> %tmp2, <8 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11>
  %tmp4 = shufflevector <8 x i8> %tmp1, <8 x i8> %tmp2, <8 x i32> <i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
  %tmp5 = add <8 x i8> %tmp3, %tmp4
  ret <8 x i8> %tmp5
}

; 64-bit vector, four i16 lanes.
define <4 x i16> @vzipi16(<4 x i16>* %A, <4 x i16>* %B) nounwind {
;CHECK-LABEL: vzipi16:
;CHECK: zip1.4h
;CHECK: zip2.4h
;CHECK-NEXT: add.4h
  %tmp1 = load <4 x i16>, <4 x i16>* %A
  %tmp2 = load <4 x i16>, <4 x i16>* %B
  %tmp3 = shufflevector <4 x i16> %tmp1, <4 x i16> %tmp2, <4 x i32> <i32 0, i32 4, i32 1, i32 5>
  %tmp4 = shufflevector <4 x i16> %tmp1, <4 x i16> %tmp2, <4 x i32> <i32 2, i32 6, i32 3, i32 7>
  %tmp5 = add <4 x i16> %tmp3, %tmp4
  ret <4 x i16> %tmp5
}

; 128-bit vector, sixteen i8 lanes.
define <16 x i8> @vzipQi8(<16 x i8>* %A, <16 x i8>* %B) nounwind {
;CHECK-LABEL: vzipQi8:
;CHECK: zip1.16b
;CHECK: zip2.16b
;CHECK-NEXT: add.16b
  %tmp1 = load <16 x i8>, <16 x i8>* %A
  %tmp2 = load <16 x i8>, <16 x i8>* %B
  %tmp3 = shufflevector <16 x i8> %tmp1, <16 x i8> %tmp2, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
  %tmp4 = shufflevector <16 x i8> %tmp1, <16 x i8> %tmp2, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
  %tmp5 = add <16 x i8> %tmp3, %tmp4
  ret <16 x i8> %tmp5
}

; 128-bit vector, eight i16 lanes.
define <8 x i16> @vzipQi16(<8 x i16>* %A, <8 x i16>* %B) nounwind {
;CHECK-LABEL: vzipQi16:
;CHECK: zip1.8h
;CHECK: zip2.8h
;CHECK-NEXT: add.8h
  %tmp1 = load <8 x i16>, <8 x i16>* %A
  %tmp2 = load <8 x i16>, <8 x i16>* %B
  %tmp3 = shufflevector <8 x i16> %tmp1, <8 x i16> %tmp2, <8 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11>
  %tmp4 = shufflevector <8 x i16> %tmp1, <8 x i16> %tmp2, <8 x i32> <i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
  %tmp5 = add <8 x i16> %tmp3, %tmp4
  ret <8 x i16> %tmp5
}

; 128-bit vector, four i32 lanes.
define <4 x i32> @vzipQi32(<4 x i32>* %A, <4 x i32>* %B) nounwind {
;CHECK-LABEL: vzipQi32:
;CHECK: zip1.4s
;CHECK: zip2.4s
;CHECK-NEXT: add.4s
  %tmp1 = load <4 x i32>, <4 x i32>* %A
  %tmp2 = load <4 x i32>, <4 x i32>* %B
  %tmp3 = shufflevector <4 x i32> %tmp1, <4 x i32> %tmp2, <4 x i32> <i32 0, i32 4, i32 1, i32 5>
  %tmp4 = shufflevector <4 x i32> %tmp1, <4 x i32> %tmp2, <4 x i32> <i32 2, i32 6, i32 3, i32 7>
  %tmp5 = add <4 x i32> %tmp3, %tmp4
  ret <4 x i32> %tmp5
}

; 128-bit vector, four float lanes; the combining instruction is fadd here.
define <4 x float> @vzipQf(<4 x float>* %A, <4 x float>* %B) nounwind {
;CHECK-LABEL: vzipQf:
;CHECK: zip1.4s
;CHECK: zip2.4s
;CHECK-NEXT: fadd.4s
  %tmp1 = load <4 x float>, <4 x float>* %A
  %tmp2 = load <4 x float>, <4 x float>* %B
  %tmp3 = shufflevector <4 x float> %tmp1, <4 x float> %tmp2, <4 x i32> <i32 0, i32 4, i32 1, i32 5>
  %tmp4 = shufflevector <4 x float> %tmp1, <4 x float> %tmp2, <4 x i32> <i32 2, i32 6, i32 3, i32 7>
  %tmp5 = fadd <4 x float> %tmp3, %tmp4
  ret <4 x float> %tmp5
}

; Undef shuffle indices should not prevent matching to ZIP1/ZIP2:
; the two functions below reuse the interleave masks from vzipi8 and vzipQi8
; with some of the lane indices replaced by undef.

define <8 x i8> @vzipi8_undef(<8 x i8>* %A, <8 x i8>* %B) nounwind {
;CHECK-LABEL: vzipi8_undef:
;CHECK: zip1.8b
;CHECK: zip2.8b
;CHECK-NEXT: add.8b
  %tmp1 = load <8 x i8>, <8 x i8>* %A
  %tmp2 = load <8 x i8>, <8 x i8>* %B
  %tmp3 = shufflevector <8 x i8> %tmp1, <8 x i8> %tmp2, <8 x i32> <i32 0, i32 undef, i32 1, i32 9, i32 undef, i32 10, i32 3, i32 11>
  %tmp4 = shufflevector <8 x i8> %tmp1, <8 x i8> %tmp2, <8 x i32> <i32 4, i32 12, i32 5, i32 13, i32 6, i32 undef, i32 undef, i32 15>
  %tmp5 = add <8 x i8> %tmp3, %tmp4
  ret <8 x i8> %tmp5
}

define <16 x i8> @vzipQi8_undef(<16 x i8>* %A, <16 x i8>* %B) nounwind {
;CHECK-LABEL: vzipQi8_undef:
;CHECK: zip1.16b
;CHECK: zip2.16b
;CHECK-NEXT: add.16b
  %tmp1 = load <16 x i8>, <16 x i8>* %A
  %tmp2 = load <16 x i8>, <16 x i8>* %B
  %tmp3 = shufflevector <16 x i8> %tmp1, <16 x i8> %tmp2, <16 x i32> <i32 0, i32 16, i32 1, i32 undef, i32 undef, i32 undef, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
  %tmp4 = shufflevector <16 x i8> %tmp1, <16 x i8> %tmp2, <16 x i32> <i32 8, i32 24, i32 9, i32 undef, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 undef, i32 14, i32 30, i32 undef, i32 31>
  %tmp5 = add <16 x i8> %tmp3, %tmp4
  ret <16 x i8> %tmp5
}