xref: /aosp_15_r20/external/llvm/test/CodeGen/AArch64/trunc-v1i64.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
1*9880d681SAndroid Build Coastguard Worker; RUN: llc -mtriple=aarch64-none-linux-gnu -mattr=+neon -verify-machineinstrs < %s | FileCheck %s
2*9880d681SAndroid Build Coastguard Worker
3*9880d681SAndroid Build Coastguard Worker; An optimization in DAG Combiner to fold
4*9880d681SAndroid Build Coastguard Worker; (trunc (concat ... x ...)) -> (concat ..., (trunc x), ...)
5*9880d681SAndroid Build Coastguard Worker; will generate nodes like:
6*9880d681SAndroid Build Coastguard Worker;     v1i32 trunc v1i64, v1i16 trunc v1i64, v1i8 trunc v1i64.
7*9880d681SAndroid Build Coastguard Worker; By default such nodes are scalarized in type legalization. But such
8*9880d681SAndroid Build Coastguard Worker; scalarization will cause an assertion failure, as v1i64 is a legal type in
9*9880d681SAndroid Build Coastguard Worker; AArch64. We change the default behaviour from scalarizing to widening.
10*9880d681SAndroid Build Coastguard Worker
11*9880d681SAndroid Build Coastguard Worker; FIXME: Currently XTN is generated for v1i32, but it could be optimized away,
12*9880d681SAndroid Build Coastguard Worker; just as no XTN is generated for v1i16 and v1i8.
13*9880d681SAndroid Build Coastguard Worker
; test_v1i32_0: places the single i64 element of %in0 in lane 0 of a
; <2 x i64> vector (lane 1 is undef) and truncates it to <2 x i32>.
; The directives below expect an xtn from .2d to .2s (see the FIXME above).
14*9880d681SAndroid Build Coastguard Workerdefine <2 x i32> @test_v1i32_0(<1 x i64> %in0) {
15*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_v1i32_0:
16*9880d681SAndroid Build Coastguard Worker; CHECK: xtn v0.2s, v0.2d
17*9880d681SAndroid Build Coastguard Worker  %1 = shufflevector <1 x i64> %in0, <1 x i64> undef, <2 x i32> <i32 0, i32 undef>
18*9880d681SAndroid Build Coastguard Worker  %2 = trunc <2 x i64> %1 to <2 x i32>
19*9880d681SAndroid Build Coastguard Worker  ret <2 x i32> %2
20*9880d681SAndroid Build Coastguard Worker}
21*9880d681SAndroid Build Coastguard Worker
; test_v1i32_1: same as test_v1i32_0, but the element of %in0 is placed in
; lane 1 of the <2 x i64> vector (lane 0 is undef) before the truncation.
; The directives below expect an xtn immediately followed by a dup of lane 0.
22*9880d681SAndroid Build Coastguard Workerdefine <2 x i32> @test_v1i32_1(<1 x i64> %in0) {
23*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_v1i32_1:
24*9880d681SAndroid Build Coastguard Worker; CHECK: xtn v0.2s, v0.2d
25*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: dup v0.2s, v0.s[0]
26*9880d681SAndroid Build Coastguard Worker  %1 = shufflevector <1 x i64> %in0, <1 x i64> undef, <2 x i32> <i32 undef, i32 0>
27*9880d681SAndroid Build Coastguard Worker  %2 = trunc <2 x i64> %1 to <2 x i32>
28*9880d681SAndroid Build Coastguard Worker  ret <2 x i32> %2
29*9880d681SAndroid Build Coastguard Worker}
30*9880d681SAndroid Build Coastguard Worker
; test_v1i16_0: places the single i64 element of %in0 in lane 0 of a
; <4 x i64> vector (remaining lanes undef) and truncates it to <4 x i16>.
; The directive below requires that no xtn is emitted for this function.
31*9880d681SAndroid Build Coastguard Workerdefine <4 x i16> @test_v1i16_0(<1 x i64> %in0) {
32*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_v1i16_0:
33*9880d681SAndroid Build Coastguard Worker; CHECK-NOT: xtn
34*9880d681SAndroid Build Coastguard Worker  %1 = shufflevector <1 x i64> %in0, <1 x i64> undef, <4 x i32> <i32 0, i32 undef, i32 undef, i32 undef>
35*9880d681SAndroid Build Coastguard Worker  %2 = trunc <4 x i64> %1 to <4 x i16>
36*9880d681SAndroid Build Coastguard Worker  ret <4 x i16> %2
37*9880d681SAndroid Build Coastguard Worker}
38*9880d681SAndroid Build Coastguard Worker
; test_v1i16_1: same as test_v1i16_0, but the element of %in0 is placed in
; lane 2 of the <4 x i64> vector (all other lanes undef) before truncation.
; The directives below require no xtn ahead of the expected dup of h[0].
39*9880d681SAndroid Build Coastguard Workerdefine <4 x i16> @test_v1i16_1(<1 x i64> %in0) {
40*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_v1i16_1:
41*9880d681SAndroid Build Coastguard Worker; CHECK-NOT: xtn
42*9880d681SAndroid Build Coastguard Worker; CHECK: dup v0.4h, v0.h[0]
43*9880d681SAndroid Build Coastguard Worker  %1 = shufflevector <1 x i64> %in0, <1 x i64> undef, <4 x i32> <i32 undef, i32 undef, i32 0, i32 undef>
44*9880d681SAndroid Build Coastguard Worker  %2 = trunc <4 x i64> %1 to <4 x i16>
45*9880d681SAndroid Build Coastguard Worker  ret <4 x i16> %2
46*9880d681SAndroid Build Coastguard Worker}
47*9880d681SAndroid Build Coastguard Worker
; test_v1i8_0: places the single i64 element of %in0 in lane 0 of an
; <8 x i64> vector (remaining lanes undef) and truncates it to <8 x i8>.
; The directive below requires that no xtn is emitted for this function.
48*9880d681SAndroid Build Coastguard Workerdefine <8 x i8> @test_v1i8_0(<1 x i64> %in0) {
49*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_v1i8_0:
50*9880d681SAndroid Build Coastguard Worker; CHECK-NOT: xtn
51*9880d681SAndroid Build Coastguard Worker  %1 = shufflevector <1 x i64> %in0, <1 x i64> undef, <8 x i32> <i32 0, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>
52*9880d681SAndroid Build Coastguard Worker  %2 = trunc <8 x i64> %1 to <8 x i8>
53*9880d681SAndroid Build Coastguard Worker  ret <8 x i8> %2
54*9880d681SAndroid Build Coastguard Worker}
55*9880d681SAndroid Build Coastguard Worker
; test_v1i8_1: same as test_v1i8_0, but the element of %in0 is placed in
; lane 2 of the <8 x i64> vector (all other lanes undef) before truncation.
; The directives below require no xtn ahead of the expected dup of b[0].
56*9880d681SAndroid Build Coastguard Workerdefine <8 x i8> @test_v1i8_1(<1 x i64> %in0) {
57*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_v1i8_1:
58*9880d681SAndroid Build Coastguard Worker; CHECK-NOT: xtn
59*9880d681SAndroid Build Coastguard Worker; CHECK: dup v0.8b, v0.b[0]
60*9880d681SAndroid Build Coastguard Worker  %1 = shufflevector <1 x i64> %in0, <1 x i64> undef, <8 x i32> <i32 undef, i32 undef, i32 0, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>
61*9880d681SAndroid Build Coastguard Worker  %2 = trunc <8 x i64> %1 to <8 x i8>
62*9880d681SAndroid Build Coastguard Worker  ret <8 x i8> %2
63*9880d681SAndroid Build Coastguard Worker}
64*9880d681SAndroid Build Coastguard Worker
65*9880d681SAndroid Build Coastguard Worker; PR20777: v1i1 is also problematic, but we can't widen it, so we extract_elt
66*9880d681SAndroid Build Coastguard Worker; the i64 out of the v1i64 operand, and truncate that scalar instead.
67*9880d681SAndroid Build Coastguard Worker
; test_v1i1_0: truncates <1 x i64> directly to <1 x i1> and returns the
; vector result. The directive below expects the value to be moved from s0
; into w0 with an fmov.
68*9880d681SAndroid Build Coastguard Workerdefine <1 x i1> @test_v1i1_0(<1 x i64> %in0) {
69*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_v1i1_0:
70*9880d681SAndroid Build Coastguard Worker; CHECK: fmov w0, s0
71*9880d681SAndroid Build Coastguard Worker  %1 = trunc <1 x i64> %in0 to <1 x i1>
72*9880d681SAndroid Build Coastguard Worker  ret <1 x i1> %1
73*9880d681SAndroid Build Coastguard Worker}
74*9880d681SAndroid Build Coastguard Worker
; test_v1i1_1: truncates <1 x i64> to <1 x i1>, then extracts element 0 and
; returns it as a scalar i1. The directives below expect an fmov from s0 into
; some w register, followed by an and with #0x1 that writes w0.
75*9880d681SAndroid Build Coastguard Workerdefine i1 @test_v1i1_1(<1 x i64> %in0) {
76*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_v1i1_1:
77*9880d681SAndroid Build Coastguard Worker; CHECK: fmov [[REG:w[0-9]+]], s0
78*9880d681SAndroid Build Coastguard Worker  %1 = trunc <1 x i64> %in0 to <1 x i1>
79*9880d681SAndroid Build Coastguard Worker; CHECK: and w0, [[REG]], #0x1
80*9880d681SAndroid Build Coastguard Worker  %2 = extractelement <1 x i1> %1, i32 0
81*9880d681SAndroid Build Coastguard Worker  ret i1 %2
82*9880d681SAndroid Build Coastguard Worker}
83