xref: /aosp_15_r20/external/llvm/test/CodeGen/AArch64/arm64-zip.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
; RUN: llc < %s -march=arm64 -aarch64-neon-syntax=apple | FileCheck %s
2*9880d681SAndroid Build Coastguard Worker
; 64-bit vector of i8: the first shuffle interleaves lanes 0-3 of %tmp1 with
; lanes 0-3 of %tmp2 (mask 0,8,1,9,...), the second interleaves lanes 4-7 of
; each (mask 4,12,5,13,...). The test expects these to be selected as zip1.8b
; and zip2.8b, with add.8b on the line directly after the zip2.
define <8 x i8> @vzipi8(<8 x i8>* %A, <8 x i8>* %B) nounwind {
;CHECK-LABEL: vzipi8:
;CHECK: zip1.8b
;CHECK: zip2.8b
;CHECK-NEXT: add.8b
  %tmp1 = load <8 x i8>, <8 x i8>* %A
  %tmp2 = load <8 x i8>, <8 x i8>* %B
  %tmp3 = shufflevector <8 x i8> %tmp1, <8 x i8> %tmp2, <8 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11>
  %tmp4 = shufflevector <8 x i8> %tmp1, <8 x i8> %tmp2, <8 x i32> <i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
  ; Both shuffle results feed the add so neither zip can be dropped as dead.
  %tmp5 = add <8 x i8> %tmp3, %tmp4
  ret <8 x i8> %tmp5
}
15*9880d681SAndroid Build Coastguard Worker
; 64-bit vector of i16: the first shuffle interleaves lanes 0-1 of both inputs
; (mask 0,4,1,5), the second interleaves lanes 2-3 (mask 2,6,3,7). The test
; expects zip1.4h and zip2.4h, with add.4h on the line directly after the zip2.
define <4 x i16> @vzipi16(<4 x i16>* %A, <4 x i16>* %B) nounwind {
;CHECK-LABEL: vzipi16:
;CHECK: zip1.4h
;CHECK: zip2.4h
;CHECK-NEXT: add.4h
  %tmp1 = load <4 x i16>, <4 x i16>* %A
  %tmp2 = load <4 x i16>, <4 x i16>* %B
  %tmp3 = shufflevector <4 x i16> %tmp1, <4 x i16> %tmp2, <4 x i32> <i32 0, i32 4, i32 1, i32 5>
  %tmp4 = shufflevector <4 x i16> %tmp1, <4 x i16> %tmp2, <4 x i32> <i32 2, i32 6, i32 3, i32 7>
  ; Both shuffle results feed the add so neither zip can be dropped as dead.
  %tmp5 = add <4 x i16> %tmp3, %tmp4
  ret <4 x i16> %tmp5
}
28*9880d681SAndroid Build Coastguard Worker
; 128-bit vector of i8: the first shuffle interleaves lanes 0-7 of both inputs
; (mask 0,16,1,17,...), the second interleaves lanes 8-15 (mask 8,24,9,25,...).
; The test expects zip1.16b and zip2.16b, with add.16b on the line directly
; after the zip2.
define <16 x i8> @vzipQi8(<16 x i8>* %A, <16 x i8>* %B) nounwind {
;CHECK-LABEL: vzipQi8:
;CHECK: zip1.16b
;CHECK: zip2.16b
;CHECK-NEXT: add.16b
  %tmp1 = load <16 x i8>, <16 x i8>* %A
  %tmp2 = load <16 x i8>, <16 x i8>* %B
  %tmp3 = shufflevector <16 x i8> %tmp1, <16 x i8> %tmp2, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
  %tmp4 = shufflevector <16 x i8> %tmp1, <16 x i8> %tmp2, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
  ; Both shuffle results feed the add so neither zip can be dropped as dead.
  %tmp5 = add <16 x i8> %tmp3, %tmp4
  ret <16 x i8> %tmp5
}
41*9880d681SAndroid Build Coastguard Worker
; 128-bit vector of i16: the first shuffle interleaves lanes 0-3 of both inputs
; (mask 0,8,1,9,...), the second interleaves lanes 4-7 (mask 4,12,5,13,...).
; The test expects zip1.8h and zip2.8h, with add.8h on the line directly after
; the zip2.
define <8 x i16> @vzipQi16(<8 x i16>* %A, <8 x i16>* %B) nounwind {
;CHECK-LABEL: vzipQi16:
;CHECK: zip1.8h
;CHECK: zip2.8h
;CHECK-NEXT: add.8h
  %tmp1 = load <8 x i16>, <8 x i16>* %A
  %tmp2 = load <8 x i16>, <8 x i16>* %B
  %tmp3 = shufflevector <8 x i16> %tmp1, <8 x i16> %tmp2, <8 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11>
  %tmp4 = shufflevector <8 x i16> %tmp1, <8 x i16> %tmp2, <8 x i32> <i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
  ; Both shuffle results feed the add so neither zip can be dropped as dead.
  %tmp5 = add <8 x i16> %tmp3, %tmp4
  ret <8 x i16> %tmp5
}
54*9880d681SAndroid Build Coastguard Worker
; 128-bit vector of i32: the first shuffle interleaves lanes 0-1 of both inputs
; (mask 0,4,1,5), the second interleaves lanes 2-3 (mask 2,6,3,7). The test
; expects zip1.4s and zip2.4s, with add.4s on the line directly after the zip2.
define <4 x i32> @vzipQi32(<4 x i32>* %A, <4 x i32>* %B) nounwind {
;CHECK-LABEL: vzipQi32:
;CHECK: zip1.4s
;CHECK: zip2.4s
;CHECK-NEXT: add.4s
  %tmp1 = load <4 x i32>, <4 x i32>* %A
  %tmp2 = load <4 x i32>, <4 x i32>* %B
  %tmp3 = shufflevector <4 x i32> %tmp1, <4 x i32> %tmp2, <4 x i32> <i32 0, i32 4, i32 1, i32 5>
  %tmp4 = shufflevector <4 x i32> %tmp1, <4 x i32> %tmp2, <4 x i32> <i32 2, i32 6, i32 3, i32 7>
  ; Both shuffle results feed the add so neither zip can be dropped as dead.
  %tmp5 = add <4 x i32> %tmp3, %tmp4
  ret <4 x i32> %tmp5
}
67*9880d681SAndroid Build Coastguard Worker
; 128-bit vector of float: same interleave masks as the <4 x i32> case
; (0,4,1,5 and 2,6,3,7). The test expects the same zip1.4s / zip2.4s
; instructions, here with fadd.4s on the line directly after the zip2.
define <4 x float> @vzipQf(<4 x float>* %A, <4 x float>* %B) nounwind {
;CHECK-LABEL: vzipQf:
;CHECK: zip1.4s
;CHECK: zip2.4s
;CHECK-NEXT: fadd.4s
  %tmp1 = load <4 x float>, <4 x float>* %A
  %tmp2 = load <4 x float>, <4 x float>* %B
  %tmp3 = shufflevector <4 x float> %tmp1, <4 x float> %tmp2, <4 x i32> <i32 0, i32 4, i32 1, i32 5>
  %tmp4 = shufflevector <4 x float> %tmp1, <4 x float> %tmp2, <4 x i32> <i32 2, i32 6, i32 3, i32 7>
  ; Both shuffle results feed the fadd so neither zip can be dropped as dead.
  %tmp5 = fadd <4 x float> %tmp3, %tmp4
  ret <4 x float> %tmp5
}
80*9880d681SAndroid Build Coastguard Worker
; Undef shuffle indices should not prevent matching to ZIP1/ZIP2:
82*9880d681SAndroid Build Coastguard Worker
; Same as the <8 x i8> interleave, but some mask elements are undef: lanes 1
; and 4 of the first mask and lanes 5 and 6 of the second. Every defined
; element still agrees with the 0,8,1,9,... / 4,12,5,13,... patterns, and the
; test expects zip1.8b and zip2.8b followed directly by add.8b.
define <8 x i8> @vzipi8_undef(<8 x i8>* %A, <8 x i8>* %B) nounwind {
;CHECK-LABEL: vzipi8_undef:
;CHECK: zip1.8b
;CHECK: zip2.8b
;CHECK-NEXT: add.8b
  %tmp1 = load <8 x i8>, <8 x i8>* %A
  %tmp2 = load <8 x i8>, <8 x i8>* %B
  %tmp3 = shufflevector <8 x i8> %tmp1, <8 x i8> %tmp2, <8 x i32> <i32 0, i32 undef, i32 1, i32 9, i32 undef, i32 10, i32 3, i32 11>
  %tmp4 = shufflevector <8 x i8> %tmp1, <8 x i8> %tmp2, <8 x i32> <i32 4, i32 12, i32 5, i32 13, i32 6, i32 undef, i32 undef, i32 15>
  ; Both shuffle results feed the add so neither zip can be dropped as dead.
  %tmp5 = add <8 x i8> %tmp3, %tmp4
  ret <8 x i8> %tmp5
}
95*9880d681SAndroid Build Coastguard Worker
; Same as the <16 x i8> interleave, but some mask elements are undef: lanes
; 3-5 of the first mask and lanes 3, 11 and 14 of the second. Every defined
; element still agrees with the 0,16,1,17,... / 8,24,9,25,... patterns, and
; the test expects zip1.16b and zip2.16b followed directly by add.16b.
define <16 x i8> @vzipQi8_undef(<16 x i8>* %A, <16 x i8>* %B) nounwind {
;CHECK-LABEL: vzipQi8_undef:
;CHECK: zip1.16b
;CHECK: zip2.16b
;CHECK-NEXT: add.16b
  %tmp1 = load <16 x i8>, <16 x i8>* %A
  %tmp2 = load <16 x i8>, <16 x i8>* %B
  %tmp3 = shufflevector <16 x i8> %tmp1, <16 x i8> %tmp2, <16 x i32> <i32 0, i32 16, i32 1, i32 undef, i32 undef, i32 undef, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
  %tmp4 = shufflevector <16 x i8> %tmp1, <16 x i8> %tmp2, <16 x i32> <i32 8, i32 24, i32 9, i32 undef, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 undef, i32 14, i32 30, i32 undef, i32 31>
  ; Both shuffle results feed the add so neither zip can be dropped as dead.
  %tmp5 = add <16 x i8> %tmp3, %tmp4
  ret <16 x i8> %tmp5
}
108