test/CodeGen/aarch64-neon-fma.c

// RUN: %clang_cc1 -triple arm64-none-linux-gnu -target-feature +neon -S -emit-llvm -o - %s | opt -S -mem2reg | FileCheck %s

// Test new aarch64 intrinsics and types
*67e74705SXin Li
#include <arm_neon.h>
*67e74705SXin Li
// vmla_n_f32 (64-bit, float): the scalar c is splatted into a <2 x float>
// with two insertelements; the expected IR then multiplies b by the splat
// (fmul) and adds the product to a (fadd).
// CHECK-LABEL: define <2 x float> @test_vmla_n_f32(<2 x float> %a, <2 x float> %b, float %c) #0 {
// CHECK:   [[VECINIT_I:%.*]] = insertelement <2 x float> undef, float %c, i32 0
// CHECK:   [[VECINIT1_I:%.*]] = insertelement <2 x float> [[VECINIT_I]], float %c, i32 1
// CHECK:   [[MUL_I:%.*]] = fmul <2 x float> %b, [[VECINIT1_I]]
// CHECK:   [[ADD_I:%.*]] = fadd <2 x float> %a, [[MUL_I]]
// CHECK:   ret <2 x float> [[ADD_I]]
float32x2_t test_vmla_n_f32(float32x2_t a, float32x2_t b, float32_t c) {
  return vmla_n_f32(a, b, c);
}
*67e74705SXin Li
// vmlaq_n_f32 (128-bit, float): the scalar c is splatted into a <4 x float>
// with four insertelements; the expected IR then multiplies b by the splat
// (fmul) and adds the product to a (fadd).
// CHECK-LABEL: define <4 x float> @test_vmlaq_n_f32(<4 x float> %a, <4 x float> %b, float %c) #0 {
// CHECK:   [[VECINIT_I:%.*]] = insertelement <4 x float> undef, float %c, i32 0
// CHECK:   [[VECINIT1_I:%.*]] = insertelement <4 x float> [[VECINIT_I]], float %c, i32 1
// CHECK:   [[VECINIT2_I:%.*]] = insertelement <4 x float> [[VECINIT1_I]], float %c, i32 2
// CHECK:   [[VECINIT3_I:%.*]] = insertelement <4 x float> [[VECINIT2_I]], float %c, i32 3
// CHECK:   [[MUL_I:%.*]] = fmul <4 x float> %b, [[VECINIT3_I]]
// CHECK:   [[ADD_I:%.*]] = fadd <4 x float> %a, [[MUL_I]]
// CHECK:   ret <4 x float> [[ADD_I]]
float32x4_t test_vmlaq_n_f32(float32x4_t a, float32x4_t b, float32_t c) {
  return vmlaq_n_f32(a, b, c);
}
*67e74705SXin Li
// vmlaq_n_f64 (128-bit, double): the scalar c is splatted into a
// <2 x double> with two insertelements; the expected IR then multiplies b by
// the splat (fmul) and adds the product to a (fadd).
// CHECK-LABEL: define <2 x double> @test_vmlaq_n_f64(<2 x double> %a, <2 x double> %b, double %c) #0 {
// CHECK:   [[VECINIT_I:%.*]] = insertelement <2 x double> undef, double %c, i32 0
// CHECK:   [[VECINIT1_I:%.*]] = insertelement <2 x double> [[VECINIT_I]], double %c, i32 1
// CHECK:   [[MUL_I:%.*]] = fmul <2 x double> %b, [[VECINIT1_I]]
// CHECK:   [[ADD_I:%.*]] = fadd <2 x double> %a, [[MUL_I]]
// CHECK:   ret <2 x double> [[ADD_I]]
float64x2_t test_vmlaq_n_f64(float64x2_t a, float64x2_t b, float64_t c) {
  return vmlaq_n_f64(a, b, c);
}
*67e74705SXin Li
// vmlsq_n_f32 (128-bit, float): the scalar c is splatted into a <4 x float>
// with four insertelements; the expected IR then multiplies b by the splat
// (fmul) and subtracts the product from a (fsub).
// CHECK-LABEL: define <4 x float> @test_vmlsq_n_f32(<4 x float> %a, <4 x float> %b, float %c) #0 {
// CHECK:   [[VECINIT_I:%.*]] = insertelement <4 x float> undef, float %c, i32 0
// CHECK:   [[VECINIT1_I:%.*]] = insertelement <4 x float> [[VECINIT_I]], float %c, i32 1
// CHECK:   [[VECINIT2_I:%.*]] = insertelement <4 x float> [[VECINIT1_I]], float %c, i32 2
// CHECK:   [[VECINIT3_I:%.*]] = insertelement <4 x float> [[VECINIT2_I]], float %c, i32 3
// CHECK:   [[MUL_I:%.*]] = fmul <4 x float> %b, [[VECINIT3_I]]
// CHECK:   [[SUB_I:%.*]] = fsub <4 x float> %a, [[MUL_I]]
// CHECK:   ret <4 x float> [[SUB_I]]
float32x4_t test_vmlsq_n_f32(float32x4_t a, float32x4_t b, float32_t c) {
  return vmlsq_n_f32(a, b, c);
}
*67e74705SXin Li
// vmls_n_f32 (64-bit, float): the scalar c is splatted into a <2 x float>
// with two insertelements; the expected IR then multiplies b by the splat
// (fmul) and subtracts the product from a (fsub).
// CHECK-LABEL: define <2 x float> @test_vmls_n_f32(<2 x float> %a, <2 x float> %b, float %c) #0 {
// CHECK:   [[VECINIT_I:%.*]] = insertelement <2 x float> undef, float %c, i32 0
// CHECK:   [[VECINIT1_I:%.*]] = insertelement <2 x float> [[VECINIT_I]], float %c, i32 1
// CHECK:   [[MUL_I:%.*]] = fmul <2 x float> %b, [[VECINIT1_I]]
// CHECK:   [[SUB_I:%.*]] = fsub <2 x float> %a, [[MUL_I]]
// CHECK:   ret <2 x float> [[SUB_I]]
float32x2_t test_vmls_n_f32(float32x2_t a, float32x2_t b, float32_t c) {
  return vmls_n_f32(a, b, c);
}
*67e74705SXin Li
// vmlsq_n_f64 (128-bit, double): the scalar c is splatted into a
// <2 x double> with two insertelements; the expected IR then multiplies b by
// the splat (fmul) and subtracts the product from a (fsub).
// CHECK-LABEL: define <2 x double> @test_vmlsq_n_f64(<2 x double> %a, <2 x double> %b, double %c) #0 {
// CHECK:   [[VECINIT_I:%.*]] = insertelement <2 x double> undef, double %c, i32 0
// CHECK:   [[VECINIT1_I:%.*]] = insertelement <2 x double> [[VECINIT_I]], double %c, i32 1
// CHECK:   [[MUL_I:%.*]] = fmul <2 x double> %b, [[VECINIT1_I]]
// CHECK:   [[SUB_I:%.*]] = fsub <2 x double> %a, [[MUL_I]]
// CHECK:   ret <2 x double> [[SUB_I]]
float64x2_t test_vmlsq_n_f64(float64x2_t a, float64x2_t b, float64_t c) {
  return vmlsq_n_f64(a, b, c);
}
*67e74705SXin Li
// vmla_lane_f32 with lane 0: lane 0 of the 64-bit vector v is broadcast by a
// shufflevector with a zeroinitializer mask; the expected IR then emits
// fmul with b followed by fadd with a.
// CHECK-LABEL: define <2 x float> @test_vmla_lane_f32_0(<2 x float> %a, <2 x float> %b, <2 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <2 x float> %v, <2 x float> %v, <2 x i32> zeroinitializer
// CHECK:   [[MUL:%.*]] = fmul <2 x float> %b, [[SHUFFLE]]
// CHECK:   [[ADD:%.*]] = fadd <2 x float> %a, [[MUL]]
// CHECK:   ret <2 x float> [[ADD]]
float32x2_t test_vmla_lane_f32_0(float32x2_t a, float32x2_t b, float32x2_t v) {
  return vmla_lane_f32(a, b, v, 0);
}
*67e74705SXin Li
// vmlaq_lane_f32 with lane 0: lane 0 of the 64-bit vector v is broadcast to
// four elements by a shufflevector with a zeroinitializer mask; the expected
// IR then emits fmul with b followed by fadd with a.
// CHECK-LABEL: define <4 x float> @test_vmlaq_lane_f32_0(<4 x float> %a, <4 x float> %b, <2 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <2 x float> %v, <2 x float> %v, <4 x i32> zeroinitializer
// CHECK:   [[MUL:%.*]] = fmul <4 x float> %b, [[SHUFFLE]]
// CHECK:   [[ADD:%.*]] = fadd <4 x float> %a, [[MUL]]
// CHECK:   ret <4 x float> [[ADD]]
float32x4_t test_vmlaq_lane_f32_0(float32x4_t a, float32x4_t b, float32x2_t v) {
  return vmlaq_lane_f32(a, b, v, 0);
}
*67e74705SXin Li
// vmla_laneq_f32 with lane 0: lane 0 of the 128-bit vector v is broadcast to
// two elements by a shufflevector with a zeroinitializer mask; the expected
// IR then emits fmul with b followed by fadd with a.
// CHECK-LABEL: define <2 x float> @test_vmla_laneq_f32_0(<2 x float> %a, <2 x float> %b, <4 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <4 x float> %v, <4 x float> %v, <2 x i32> zeroinitializer
// CHECK:   [[MUL:%.*]] = fmul <2 x float> %b, [[SHUFFLE]]
// CHECK:   [[ADD:%.*]] = fadd <2 x float> %a, [[MUL]]
// CHECK:   ret <2 x float> [[ADD]]
float32x2_t test_vmla_laneq_f32_0(float32x2_t a, float32x2_t b, float32x4_t v) {
  return vmla_laneq_f32(a, b, v, 0);
}
*67e74705SXin Li
// vmlaq_laneq_f32 with lane 0: lane 0 of the 128-bit vector v is broadcast by
// a shufflevector with a zeroinitializer mask; the expected IR then emits
// fmul with b followed by fadd with a.
// CHECK-LABEL: define <4 x float> @test_vmlaq_laneq_f32_0(<4 x float> %a, <4 x float> %b, <4 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <4 x float> %v, <4 x float> %v, <4 x i32> zeroinitializer
// CHECK:   [[MUL:%.*]] = fmul <4 x float> %b, [[SHUFFLE]]
// CHECK:   [[ADD:%.*]] = fadd <4 x float> %a, [[MUL]]
// CHECK:   ret <4 x float> [[ADD]]
float32x4_t test_vmlaq_laneq_f32_0(float32x4_t a, float32x4_t b, float32x4_t v) {
  return vmlaq_laneq_f32(a, b, v, 0);
}
*67e74705SXin Li
// vmls_lane_f32 with lane 0: lane 0 of the 64-bit vector v is broadcast by a
// shufflevector with a zeroinitializer mask; the expected IR then emits
// fmul with b followed by fsub from a.
// CHECK-LABEL: define <2 x float> @test_vmls_lane_f32_0(<2 x float> %a, <2 x float> %b, <2 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <2 x float> %v, <2 x float> %v, <2 x i32> zeroinitializer
// CHECK:   [[MUL:%.*]] = fmul <2 x float> %b, [[SHUFFLE]]
// CHECK:   [[SUB:%.*]] = fsub <2 x float> %a, [[MUL]]
// CHECK:   ret <2 x float> [[SUB]]
float32x2_t test_vmls_lane_f32_0(float32x2_t a, float32x2_t b, float32x2_t v) {
  return vmls_lane_f32(a, b, v, 0);
}
*67e74705SXin Li
// vmlsq_lane_f32 with lane 0: lane 0 of the 64-bit vector v is broadcast to
// four elements by a shufflevector with a zeroinitializer mask; the expected
// IR then emits fmul with b followed by fsub from a.
// CHECK-LABEL: define <4 x float> @test_vmlsq_lane_f32_0(<4 x float> %a, <4 x float> %b, <2 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <2 x float> %v, <2 x float> %v, <4 x i32> zeroinitializer
// CHECK:   [[MUL:%.*]] = fmul <4 x float> %b, [[SHUFFLE]]
// CHECK:   [[SUB:%.*]] = fsub <4 x float> %a, [[MUL]]
// CHECK:   ret <4 x float> [[SUB]]
float32x4_t test_vmlsq_lane_f32_0(float32x4_t a, float32x4_t b, float32x2_t v) {
  return vmlsq_lane_f32(a, b, v, 0);
}
*67e74705SXin Li
// vmls_laneq_f32 with lane 0: lane 0 of the 128-bit vector v is broadcast to
// two elements by a shufflevector with a zeroinitializer mask; the expected
// IR then emits fmul with b followed by fsub from a.
// CHECK-LABEL: define <2 x float> @test_vmls_laneq_f32_0(<2 x float> %a, <2 x float> %b, <4 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <4 x float> %v, <4 x float> %v, <2 x i32> zeroinitializer
// CHECK:   [[MUL:%.*]] = fmul <2 x float> %b, [[SHUFFLE]]
// CHECK:   [[SUB:%.*]] = fsub <2 x float> %a, [[MUL]]
// CHECK:   ret <2 x float> [[SUB]]
float32x2_t test_vmls_laneq_f32_0(float32x2_t a, float32x2_t b, float32x4_t v) {
  return vmls_laneq_f32(a, b, v, 0);
}
*67e74705SXin Li
// vmlsq_laneq_f32 with lane 0: lane 0 of the 128-bit vector v is broadcast by
// a shufflevector with a zeroinitializer mask; the expected IR then emits
// fmul with b followed by fsub from a.
// CHECK-LABEL: define <4 x float> @test_vmlsq_laneq_f32_0(<4 x float> %a, <4 x float> %b, <4 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <4 x float> %v, <4 x float> %v, <4 x i32> zeroinitializer
// CHECK:   [[MUL:%.*]] = fmul <4 x float> %b, [[SHUFFLE]]
// CHECK:   [[SUB:%.*]] = fsub <4 x float> %a, [[MUL]]
// CHECK:   ret <4 x float> [[SUB]]
float32x4_t test_vmlsq_laneq_f32_0(float32x4_t a, float32x4_t b, float32x4_t v) {
  return vmlsq_laneq_f32(a, b, v, 0);
}
*67e74705SXin Li
// vmla_lane_f32 with lane 1: lane 1 of the 64-bit vector v is broadcast by a
// shufflevector with an all-ones index mask; the expected IR then emits
// fmul with b followed by fadd with a.
// CHECK-LABEL: define <2 x float> @test_vmla_lane_f32(<2 x float> %a, <2 x float> %b, <2 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <2 x float> %v, <2 x float> %v, <2 x i32> <i32 1, i32 1>
// CHECK:   [[MUL:%.*]] = fmul <2 x float> %b, [[SHUFFLE]]
// CHECK:   [[ADD:%.*]] = fadd <2 x float> %a, [[MUL]]
// CHECK:   ret <2 x float> [[ADD]]
float32x2_t test_vmla_lane_f32(float32x2_t a, float32x2_t b, float32x2_t v) {
  return vmla_lane_f32(a, b, v, 1);
}
*67e74705SXin Li
// vmlaq_lane_f32 with lane 1: lane 1 of the 64-bit vector v is broadcast to
// four elements by a shufflevector; the expected IR then emits fmul with b
// followed by fadd with a.
// CHECK-LABEL: define <4 x float> @test_vmlaq_lane_f32(<4 x float> %a, <4 x float> %b, <2 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <2 x float> %v, <2 x float> %v, <4 x i32> <i32 1, i32 1, i32 1, i32 1>
// CHECK:   [[MUL:%.*]] = fmul <4 x float> %b, [[SHUFFLE]]
// CHECK:   [[ADD:%.*]] = fadd <4 x float> %a, [[MUL]]
// CHECK:   ret <4 x float> [[ADD]]
float32x4_t test_vmlaq_lane_f32(float32x4_t a, float32x4_t b, float32x2_t v) {
  return vmlaq_lane_f32(a, b, v, 1);
}
*67e74705SXin Li
// vmla_laneq_f32 with lane 3: lane 3 of the 128-bit vector v is broadcast to
// two elements by a shufflevector; the expected IR then emits fmul with b
// followed by fadd with a.
// CHECK-LABEL: define <2 x float> @test_vmla_laneq_f32(<2 x float> %a, <2 x float> %b, <4 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <4 x float> %v, <4 x float> %v, <2 x i32> <i32 3, i32 3>
// CHECK:   [[MUL:%.*]] = fmul <2 x float> %b, [[SHUFFLE]]
// CHECK:   [[ADD:%.*]] = fadd <2 x float> %a, [[MUL]]
// CHECK:   ret <2 x float> [[ADD]]
float32x2_t test_vmla_laneq_f32(float32x2_t a, float32x2_t b, float32x4_t v) {
  return vmla_laneq_f32(a, b, v, 3);
}
*67e74705SXin Li
// vmlaq_laneq_f32 with lane 3: lane 3 of the 128-bit vector v is broadcast by
// a shufflevector; the expected IR then emits fmul with b followed by fadd
// with a.
// CHECK-LABEL: define <4 x float> @test_vmlaq_laneq_f32(<4 x float> %a, <4 x float> %b, <4 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <4 x float> %v, <4 x float> %v, <4 x i32> <i32 3, i32 3, i32 3, i32 3>
// CHECK:   [[MUL:%.*]] = fmul <4 x float> %b, [[SHUFFLE]]
// CHECK:   [[ADD:%.*]] = fadd <4 x float> %a, [[MUL]]
// CHECK:   ret <4 x float> [[ADD]]
float32x4_t test_vmlaq_laneq_f32(float32x4_t a, float32x4_t b, float32x4_t v) {
  return vmlaq_laneq_f32(a, b, v, 3);
}
*67e74705SXin Li
// vmls_lane_f32 with lane 1: lane 1 of the 64-bit vector v is broadcast by a
// shufflevector; the expected IR then emits fmul with b followed by fsub
// from a.
// CHECK-LABEL: define <2 x float> @test_vmls_lane_f32(<2 x float> %a, <2 x float> %b, <2 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <2 x float> %v, <2 x float> %v, <2 x i32> <i32 1, i32 1>
// CHECK:   [[MUL:%.*]] = fmul <2 x float> %b, [[SHUFFLE]]
// CHECK:   [[SUB:%.*]] = fsub <2 x float> %a, [[MUL]]
// CHECK:   ret <2 x float> [[SUB]]
float32x2_t test_vmls_lane_f32(float32x2_t a, float32x2_t b, float32x2_t v) {
  return vmls_lane_f32(a, b, v, 1);
}
*67e74705SXin Li
// vmlsq_lane_f32 with lane 1: lane 1 of the 64-bit vector v is broadcast to
// four elements by a shufflevector; the expected IR then emits fmul with b
// followed by fsub from a.
// CHECK-LABEL: define <4 x float> @test_vmlsq_lane_f32(<4 x float> %a, <4 x float> %b, <2 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <2 x float> %v, <2 x float> %v, <4 x i32> <i32 1, i32 1, i32 1, i32 1>
// CHECK:   [[MUL:%.*]] = fmul <4 x float> %b, [[SHUFFLE]]
// CHECK:   [[SUB:%.*]] = fsub <4 x float> %a, [[MUL]]
// CHECK:   ret <4 x float> [[SUB]]
float32x4_t test_vmlsq_lane_f32(float32x4_t a, float32x4_t b, float32x2_t v) {
  return vmlsq_lane_f32(a, b, v, 1);
}
// vmls_laneq_f32 with lane 3: lane 3 of the 128-bit vector v is broadcast to
// two elements by a shufflevector; the expected IR then emits fmul with b
// followed by fsub from a.
// CHECK-LABEL: define <2 x float> @test_vmls_laneq_f32(<2 x float> %a, <2 x float> %b, <4 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <4 x float> %v, <4 x float> %v, <2 x i32> <i32 3, i32 3>
// CHECK:   [[MUL:%.*]] = fmul <2 x float> %b, [[SHUFFLE]]
// CHECK:   [[SUB:%.*]] = fsub <2 x float> %a, [[MUL]]
// CHECK:   ret <2 x float> [[SUB]]
float32x2_t test_vmls_laneq_f32(float32x2_t a, float32x2_t b, float32x4_t v) {
  return vmls_laneq_f32(a, b, v, 3);
}
*67e74705SXin Li
// vmlsq_laneq_f32 with lane 3: lane 3 of the 128-bit vector v is broadcast by
// a shufflevector; the expected IR then emits fmul with b followed by fsub
// from a.
// CHECK-LABEL: define <4 x float> @test_vmlsq_laneq_f32(<4 x float> %a, <4 x float> %b, <4 x float> %v) #0 {
// CHECK:   [[SHUFFLE:%.*]] = shufflevector <4 x float> %v, <4 x float> %v, <4 x i32> <i32 3, i32 3, i32 3, i32 3>
// CHECK:   [[MUL:%.*]] = fmul <4 x float> %b, [[SHUFFLE]]
// CHECK:   [[SUB:%.*]] = fsub <4 x float> %a, [[MUL]]
// CHECK:   ret <4 x float> [[SUB]]
float32x4_t test_vmlsq_laneq_f32(float32x4_t a, float32x4_t b, float32x4_t v) {
  return vmlsq_laneq_f32(a, b, v, 3);
}
*67e74705SXin Li
// vfmaq_n_f64 (128-bit, double): the scalar c is splatted into a
// <2 x double>; a, b and the splat are each bitcast to <16 x i8> and back,
// and the expected IR ends in a call to @llvm.fma.v2f64 with operands
// (b, splat(c), a).
// CHECK-LABEL: define <2 x double> @test_vfmaq_n_f64(<2 x double> %a, <2 x double> %b, double %c) #0 {
// CHECK:   [[VECINIT_I:%.*]] = insertelement <2 x double> undef, double %c, i32 0
// CHECK:   [[VECINIT1_I:%.*]] = insertelement <2 x double> [[VECINIT_I]], double %c, i32 1
// CHECK:   [[TMP0:%.*]] = bitcast <2 x double> %a to <16 x i8>
// CHECK:   [[TMP1:%.*]] = bitcast <2 x double> %b to <16 x i8>
// CHECK:   [[TMP2:%.*]] = bitcast <2 x double> [[VECINIT1_I]] to <16 x i8>
// CHECK:   [[TMP3:%.*]] = bitcast <16 x i8> [[TMP0]] to <2 x double>
// CHECK:   [[TMP4:%.*]] = bitcast <16 x i8> [[TMP1]] to <2 x double>
// CHECK:   [[TMP5:%.*]] = bitcast <16 x i8> [[TMP2]] to <2 x double>
// CHECK:   [[TMP6:%.*]] = call <2 x double> @llvm.fma.v2f64(<2 x double> [[TMP4]], <2 x double> [[TMP5]], <2 x double> [[TMP3]]) #2
// CHECK:   ret <2 x double> [[TMP6]]
float64x2_t test_vfmaq_n_f64(float64x2_t a, float64x2_t b, float64_t c) {
  return vfmaq_n_f64(a, b, c);
}
*67e74705SXin Li
// vfmsq_n_f64 (128-bit, double): b is negated first (fsub from a -0.0
// vector), the scalar c is splatted into a <2 x double>, the operands are
// bitcast to <16 x i8> and back, and the expected IR ends in a call to
// @llvm.fma.v2f64 with operands (-b, splat(c), a).
// CHECK-LABEL: define <2 x double> @test_vfmsq_n_f64(<2 x double> %a, <2 x double> %b, double %c) #0 {
// CHECK:   [[SUB_I:%.*]] = fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %b
// CHECK:   [[VECINIT_I:%.*]] = insertelement <2 x double> undef, double %c, i32 0
// CHECK:   [[VECINIT1_I:%.*]] = insertelement <2 x double> [[VECINIT_I]], double %c, i32 1
// CHECK:   [[TMP0:%.*]] = bitcast <2 x double> %a to <16 x i8>
// CHECK:   [[TMP1:%.*]] = bitcast <2 x double> [[SUB_I]] to <16 x i8>
// CHECK:   [[TMP2:%.*]] = bitcast <2 x double> [[VECINIT1_I]] to <16 x i8>
// CHECK:   [[TMP3:%.*]] = bitcast <16 x i8> [[TMP0]] to <2 x double>
// CHECK:   [[TMP4:%.*]] = bitcast <16 x i8> [[TMP1]] to <2 x double>
// CHECK:   [[TMP5:%.*]] = bitcast <16 x i8> [[TMP2]] to <2 x double>
// CHECK:   [[TMP6:%.*]] = call <2 x double> @llvm.fma.v2f64(<2 x double> [[TMP4]], <2 x double> [[TMP5]], <2 x double> [[TMP3]]) #2
// CHECK:   ret <2 x double> [[TMP6]]
float64x2_t test_vfmsq_n_f64(float64x2_t a, float64x2_t b, float64_t c) {
  return vfmsq_n_f64(a, b, c);
}