; RUN: llc < %s -verify-machineinstrs -march=arm64 -aarch64-neon-syntax=apple -aarch64-simd-scalar=true -asm-verbose=false -disable-adv-copy-opt=true | FileCheck %s -check-prefix=CHECK -check-prefix=CHECK-NOOPT
; RUN: llc < %s -verify-machineinstrs -march=arm64 -aarch64-neon-syntax=apple -aarch64-simd-scalar=true -asm-verbose=false -disable-adv-copy-opt=false | FileCheck %s -check-prefix=CHECK -check-prefix=CHECK-OPT
; RUN: llc < %s -verify-machineinstrs -march=arm64 -aarch64-neon-syntax=generic -aarch64-simd-scalar=true -asm-verbose=false -disable-adv-copy-opt=true | FileCheck %s -check-prefix=GENERIC -check-prefix=GENERIC-NOOPT
; RUN: llc < %s -verify-machineinstrs -march=arm64 -aarch64-neon-syntax=generic -aarch64-simd-scalar=true -asm-verbose=false -disable-adv-copy-opt=false | FileCheck %s -check-prefix=GENERIC -check-prefix=GENERIC-OPT

; Every function below is compiled four times: with the "apple" and the
; "generic" NEON assembly syntax, each with advanced copy optimization
; disabled and enabled. All runs pass -aarch64-simd-scalar=true, and the
; expectations are that 64-bit integer operations on lane 0 of a <2 x i64>
; are emitted on d/v registers.

; Builds a <2 x i64> whose lane 0 is (a+b)[0] + b[0] and whose lane 1 is
; (a+b)[0] - b[0]. The expectations differ between the copy-optimization
; modes only in how many fmov copies appear.
define <2 x i64> @bar(<2 x i64> %a, <2 x i64> %b) nounwind readnone {
; CHECK-LABEL: bar:
; CHECK: add.2d v[[REG:[0-9]+]], v0, v1
; CHECK: add d[[REG3:[0-9]+]], d[[REG]], d1
; CHECK: sub d[[REG2:[0-9]+]], d[[REG]], d1
; Without advanced copy optimization, we end up with cross-register-bank
; copies that cannot be coalesced.
; CHECK-NOOPT: fmov [[COPY_REG3:x[0-9]+]], d[[REG3]]
; With advanced copy optimization, we end up with just one copy
; to insert the computed high part into the V register.
; CHECK-OPT-NOT: fmov
; CHECK: fmov [[COPY_REG2:x[0-9]+]], d[[REG2]]
; CHECK-NOOPT: fmov d0, [[COPY_REG3]]
; CHECK-OPT-NOT: fmov
; CHECK: ins.d v0[1], [[COPY_REG2]]
; CHECK-NEXT: ret
;
; GENERIC-LABEL: bar:
; GENERIC: add v[[REG:[0-9]+]].2d, v0.2d, v1.2d
; GENERIC: add d[[REG3:[0-9]+]], d[[REG]], d1
; GENERIC: sub d[[REG2:[0-9]+]], d[[REG]], d1
; GENERIC-NOOPT: fmov [[COPY_REG3:x[0-9]+]], d[[REG3]]
; GENERIC-OPT-NOT: fmov
; GENERIC: fmov [[COPY_REG2:x[0-9]+]], d[[REG2]]
; GENERIC-NOOPT: fmov d0, [[COPY_REG3]]
; GENERIC-OPT-NOT: fmov
; GENERIC: ins v0.d[1], [[COPY_REG2]]
; GENERIC-NEXT: ret
  %add = add <2 x i64> %a, %b
  %vgetq_lane = extractelement <2 x i64> %add, i32 0
  %vgetq_lane2 = extractelement <2 x i64> %b, i32 0
  %add3 = add i64 %vgetq_lane, %vgetq_lane2
  %sub = sub i64 %vgetq_lane, %vgetq_lane2
  %vecinit = insertelement <2 x i64> undef, i64 %add3, i32 0
  %vecinit8 = insertelement <2 x i64> %vecinit, i64 %sub, i32 1
  ret <2 x i64> %vecinit8
}

; Computes b[0] - a[0] as i64 and returns the bits as a double. A single
; scalar sub on d registers is expected, immediately followed by ret.
define double @subdd_su64(<2 x i64> %a, <2 x i64> %b) nounwind readnone {
; CHECK-LABEL: subdd_su64:
; CHECK: sub d0, d1, d0
; CHECK-NEXT: ret
; GENERIC-LABEL: subdd_su64:
; GENERIC: sub d0, d1, d0
; GENERIC-NEXT: ret
  %vecext = extractelement <2 x i64> %a, i32 0
  %vecext1 = extractelement <2 x i64> %b, i32 0
  %sub.i = sub nsw i64 %vecext1, %vecext
  %retval = bitcast i64 %sub.i to double
  ret double %retval
}

; Computes b[0] + a[0] as i64 and returns the bits as a double. A single
; scalar add on d registers is expected, immediately followed by ret.
define double @vaddd_su64(<2 x i64> %a, <2 x i64> %b) nounwind readnone {
; CHECK-LABEL: vaddd_su64:
; CHECK: add d0, d1, d0
; CHECK-NEXT: ret
; GENERIC-LABEL: vaddd_su64:
; GENERIC: add d0, d1, d0
; GENERIC-NEXT: ret
  %vecext = extractelement <2 x i64> %a, i32 0
  %vecext1 = extractelement <2 x i64> %b, i32 0
  %add.i = add nsw i64 %vecext1, %vecext
  %retval = bitcast i64 %add.i to double
  ret double %retval
}

; sub MI doesn't access dsub register.
; Computes 0 - (b[0] + a[0]) and returns the bits as a double. The first
; source operand of the expected sub is matched as any d register.
define double @add_sub_su64(<2 x i64> %a, <2 x i64> %b) nounwind readnone {
; CHECK-LABEL: add_sub_su64:
; CHECK: add d0, d1, d0
; CHECK: sub d0, {{d[0-9]+}}, d0
; CHECK-NEXT: ret
; GENERIC-LABEL: add_sub_su64:
; GENERIC: add d0, d1, d0
; GENERIC: sub d0, {{d[0-9]+}}, d0
; GENERIC-NEXT: ret
  %vecext = extractelement <2 x i64> %a, i32 0
  %vecext1 = extractelement <2 x i64> %b, i32 0
  %add.i = add i64 %vecext1, %vecext
  %sub.i = sub i64 0, %add.i
  %retval = bitcast i64 %sub.i to double
  ret double %retval
}

; Computes b[0] & a[0] and returns the bits as a double. The 8-byte vector
; form of and is expected, immediately followed by ret.
define double @and_su64(<2 x i64> %a, <2 x i64> %b) nounwind readnone {
; CHECK-LABEL: and_su64:
; CHECK: and.8b v0, v1, v0
; CHECK-NEXT: ret
; GENERIC-LABEL: and_su64:
; GENERIC: and v0.8b, v1.8b, v0.8b
; GENERIC-NEXT: ret
  %vecext = extractelement <2 x i64> %a, i32 0
  %vecext1 = extractelement <2 x i64> %b, i32 0
  %and.i = and i64 %vecext1, %vecext
  %retval = bitcast i64 %and.i to double
  ret double %retval
}

; Computes b[0] | a[0] and returns the bits as a double. The 8-byte vector
; form of orr is expected, immediately followed by ret.
define double @orr_su64(<2 x i64> %a, <2 x i64> %b) nounwind readnone {
; CHECK-LABEL: orr_su64:
; CHECK: orr.8b v0, v1, v0
; CHECK-NEXT: ret
; GENERIC-LABEL: orr_su64:
; GENERIC: orr v0.8b, v1.8b, v0.8b
; GENERIC-NEXT: ret
  %vecext = extractelement <2 x i64> %a, i32 0
  %vecext1 = extractelement <2 x i64> %b, i32 0
  %or.i = or i64 %vecext1, %vecext
  %retval = bitcast i64 %or.i to double
  ret double %retval
}

; Computes b[0] ^ a[0] and returns the bits as a double. The 8-byte vector
; form of eor is expected, immediately followed by ret.
define double @xorr_su64(<2 x i64> %a, <2 x i64> %b) nounwind readnone {
; CHECK-LABEL: xorr_su64:
; CHECK: eor.8b v0, v1, v0
; CHECK-NEXT: ret
; GENERIC-LABEL: xorr_su64:
; GENERIC: eor v0.8b, v1.8b, v0.8b
; GENERIC-NEXT: ret
  %vecext = extractelement <2 x i64> %a, i32 0
  %vecext1 = extractelement <2 x i64> %b, i32 0
  %xor.i = xor i64 %vecext1, %vecext
  %retval = bitcast i64 %xor.i to double
  ret double %retval
}