1*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -march=x86-64 -mtriple=x86_64-unknown-linux-gnu -mcpu=corei7 -mattr=-f16c -asm-verbose=false -fixup-byte-word-insts=1 \ 2*9880d681SAndroid Build Coastguard Worker; RUN: | FileCheck %s -check-prefix=CHECK -check-prefix=CHECK-LIBCALL -check-prefix=BWON 3*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -march=x86-64 -mtriple=x86_64-unknown-linux-gnu -mcpu=corei7 -mattr=-f16c -asm-verbose=false -fixup-byte-word-insts=0 \ 4*9880d681SAndroid Build Coastguard Worker; RUN: | FileCheck %s -check-prefix=CHECK -check-prefix=CHECK-LIBCALL -check-prefix=BWOFF 5*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -march=x86-64 -mtriple=x86_64-unknown-linux-gnu -mcpu=corei7 -mattr=+f16c -asm-verbose=false -fixup-byte-word-insts=1 \ 6*9880d681SAndroid Build Coastguard Worker; RUN: | FileCheck %s -check-prefix=CHECK -check-prefix=CHECK-F16C -check-prefix=BWON 7*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -mtriple=i686-unknown-linux-gnu -mattr +sse2 -asm-verbose=false -fixup-byte-word-insts=0 \ 8*9880d681SAndroid Build Coastguard Worker; RUN: | FileCheck %s -check-prefix=CHECK-I686 9*9880d681SAndroid Build Coastguard Worker 10*9880d681SAndroid Build Coastguard Workerdefine void @test_load_store(half* %in, half* %out) { 11*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_load_store: 12*9880d681SAndroid Build Coastguard Worker; BWON: movzwl (%rdi), %eax 13*9880d681SAndroid Build Coastguard Worker; BWOFF: movw (%rdi), %ax 14*9880d681SAndroid Build Coastguard Worker; CHECK: movw %ax, (%rsi) 15*9880d681SAndroid Build Coastguard Worker %val = load half, half* %in 16*9880d681SAndroid Build Coastguard Worker store half %val, half* %out 17*9880d681SAndroid Build Coastguard Worker ret void 18*9880d681SAndroid Build Coastguard Worker} 19*9880d681SAndroid Build Coastguard Worker 20*9880d681SAndroid Build Coastguard Workerdefine i16 @test_bitcast_from_half(half* %addr) { 21*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_bitcast_from_half: 22*9880d681SAndroid Build Coastguard Worker; BWON: movzwl (%rdi), %eax 23*9880d681SAndroid Build Coastguard Worker; BWOFF: movw (%rdi), %ax 24*9880d681SAndroid Build Coastguard Worker %val = load half, half* %addr 25*9880d681SAndroid Build Coastguard Worker %val_int = bitcast half %val to i16 26*9880d681SAndroid Build Coastguard Worker ret i16 %val_int 27*9880d681SAndroid Build Coastguard Worker} 28*9880d681SAndroid Build Coastguard Worker 29*9880d681SAndroid Build Coastguard Workerdefine void @test_bitcast_to_half(half* %addr, i16 %in) { 30*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_bitcast_to_half: 31*9880d681SAndroid Build Coastguard Worker; CHECK: movw %si, (%rdi) 32*9880d681SAndroid Build Coastguard Worker %val_fp = bitcast i16 %in to half 33*9880d681SAndroid Build Coastguard Worker store half %val_fp, half* %addr 34*9880d681SAndroid Build Coastguard Worker ret void 35*9880d681SAndroid Build Coastguard Worker} 36*9880d681SAndroid Build Coastguard Worker 37*9880d681SAndroid Build Coastguard Workerdefine float @test_extend32(half* %addr) { 38*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_extend32: 39*9880d681SAndroid Build Coastguard Worker 40*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: jmp __gnu_h2f_ieee 41*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtph2ps 42*9880d681SAndroid Build Coastguard Worker %val16 = load half, half* %addr 43*9880d681SAndroid Build Coastguard Worker %val32 = fpext half %val16 to float 44*9880d681SAndroid Build Coastguard Worker ret float %val32 45*9880d681SAndroid Build Coastguard Worker} 46*9880d681SAndroid Build Coastguard Worker 47*9880d681SAndroid Build Coastguard Workerdefine double @test_extend64(half* %addr) { 48*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_extend64: 49*9880d681SAndroid Build Coastguard Worker 50*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: callq __gnu_h2f_ieee 51*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: cvtss2sd 52*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtph2ps 53*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtss2sd 54*9880d681SAndroid Build Coastguard Worker %val16 = load half, half* %addr 55*9880d681SAndroid Build Coastguard Worker %val32 = fpext half %val16 to double 56*9880d681SAndroid Build Coastguard Worker ret double %val32 57*9880d681SAndroid Build Coastguard Worker} 58*9880d681SAndroid Build Coastguard Worker 59*9880d681SAndroid Build Coastguard Workerdefine void @test_trunc32(float %in, half* %addr) { 60*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_trunc32: 61*9880d681SAndroid Build Coastguard Worker 62*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: callq __gnu_f2h_ieee 63*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtps2ph 64*9880d681SAndroid Build Coastguard Worker %val16 = fptrunc float %in to half 65*9880d681SAndroid Build Coastguard Worker store half %val16, half* %addr 66*9880d681SAndroid Build Coastguard Worker ret void 67*9880d681SAndroid Build Coastguard Worker} 68*9880d681SAndroid Build Coastguard Worker 69*9880d681SAndroid Build Coastguard Workerdefine void @test_trunc64(double %in, half* %addr) { 70*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_trunc64: 71*9880d681SAndroid Build Coastguard Worker 72*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: callq __truncdfhf2 73*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: callq __truncdfhf2 74*9880d681SAndroid Build Coastguard Worker %val16 = fptrunc double %in to half 75*9880d681SAndroid Build Coastguard Worker store half %val16, half* %addr 76*9880d681SAndroid Build Coastguard Worker ret void 77*9880d681SAndroid Build Coastguard Worker} 78*9880d681SAndroid Build Coastguard Worker 79*9880d681SAndroid Build Coastguard Workerdefine i64 @test_fptosi_i64(half* %p) #0 { 80*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_fptosi_i64: 81*9880d681SAndroid Build Coastguard Worker 82*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: pushq %rax 83*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: movzwl (%rdi), %edi 84*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: callq __gnu_h2f_ieee 85*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: cvttss2si %xmm0, %rax 86*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: popq %rcx 87*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: retq 88*9880d681SAndroid Build Coastguard Worker 89*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: movswl (%rdi), [[REG0:%[a-z0-9]+]] 90*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vmovd [[REG0]], [[REG1:%[a-z0-9]+]] 91*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvtph2ps [[REG1]], [[REG2:%[a-z0-9]+]] 92*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvttss2si [[REG2]], %rax 93*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: retq 94*9880d681SAndroid Build Coastguard Worker %a = load half, half* %p, align 2 95*9880d681SAndroid Build Coastguard Worker %r = fptosi half %a to i64 96*9880d681SAndroid Build Coastguard Worker ret i64 %r 97*9880d681SAndroid Build Coastguard Worker} 98*9880d681SAndroid Build Coastguard Worker 99*9880d681SAndroid Build Coastguard Workerdefine void @test_sitofp_i64(i64 %a, half* %p) #0 { 100*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_sitofp_i64: 101*9880d681SAndroid Build Coastguard Worker 102*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: pushq [[ADDR:%[a-z]+]] 103*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: movq %rsi, [[ADDR]] 104*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: cvtsi2ssq %rdi, %xmm0 105*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: callq __gnu_f2h_ieee 106*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: movw %ax, ([[ADDR]]) 107*9880d681SAndroid Build Coastguard Worker; CHECK_LIBCALL-NEXT: popq [[ADDR]] 108*9880d681SAndroid Build Coastguard Worker; CHECK_LIBCALL-NEXT: retq 109*9880d681SAndroid Build Coastguard Worker 110*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvtsi2ssq %rdi, [[REG0:%[a-z0-9]+]], [[REG0]] 111*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvtps2ph $4, [[REG0]], [[REG0]] 112*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vmovd [[REG0]], %eax 113*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: movw %ax, (%rsi) 114*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: retq 115*9880d681SAndroid Build Coastguard Worker %r = sitofp i64 %a to half 116*9880d681SAndroid Build Coastguard Worker store half %r, half* %p 117*9880d681SAndroid Build Coastguard Worker ret void 118*9880d681SAndroid Build Coastguard Worker} 119*9880d681SAndroid Build Coastguard Worker 120*9880d681SAndroid Build Coastguard Workerdefine i64 @test_fptoui_i64(half* %p) #0 { 121*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_fptoui_i64: 122*9880d681SAndroid Build Coastguard Worker 123*9880d681SAndroid Build Coastguard Worker; FP_TO_UINT is expanded using FP_TO_SINT 124*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: pushq %rax 125*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: movzwl (%rdi), %edi 126*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: callq __gnu_h2f_ieee 127*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: movss {{.[A-Z_0-9]+}}(%rip), [[REG1:%[a-z0-9]+]] 128*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: movaps %xmm0, [[REG2:%[a-z0-9]+]] 129*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: subss [[REG1]], [[REG2]] 130*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: cvttss2si [[REG2]], [[REG3:%[a-z0-9]+]] 131*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: movabsq $-9223372036854775808, [[REG4:%[a-z0-9]+]] 132*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: xorq [[REG3]], [[REG4]] 133*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: cvttss2si %xmm0, [[REG5:%[a-z0-9]+]] 134*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: ucomiss [[REG1]], %xmm0 135*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: cmovaeq [[REG4]], [[REG5]] 136*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: popq %rcx 137*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: retq 138*9880d681SAndroid Build Coastguard Worker 139*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: movswl (%rdi), [[REG0:%[a-z0-9]+]] 140*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vmovd [[REG0]], [[REG1:%[a-z0-9]+]] 141*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvtph2ps [[REG1]], [[REG2:%[a-z0-9]+]] 142*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vmovss {{.[A-Z_0-9]+}}(%rip), [[REG3:%[a-z0-9]+]] 143*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vsubss [[REG3]], [[REG2]], [[REG4:%[a-z0-9]+]] 144*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvttss2si [[REG4]], [[REG5:%[a-z0-9]+]] 145*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: movabsq $-9223372036854775808, [[REG6:%[a-z0-9]+]] 146*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: xorq [[REG5]], [[REG6:%[a-z0-9]+]] 147*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvttss2si [[REG2]], [[REG7:%[a-z0-9]+]] 148*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vucomiss [[REG3]], [[REG2]] 149*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: cmovaeq [[REG6]], %rax 150*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: retq 151*9880d681SAndroid Build Coastguard Worker %a = load half, half* %p, align 2 152*9880d681SAndroid Build Coastguard Worker %r = fptoui half %a to i64 153*9880d681SAndroid Build Coastguard Worker ret i64 %r 154*9880d681SAndroid Build Coastguard Worker} 155*9880d681SAndroid Build Coastguard Worker 156*9880d681SAndroid Build Coastguard Workerdefine void @test_uitofp_i64(i64 %a, half* %p) #0 { 157*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_uitofp_i64: 158*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: pushq [[ADDR:%[a-z0-9]+]] 159*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: movq %rsi, [[ADDR]] 160*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: movl %edi, [[REG0:%[a-z0-9]+]] 161*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: andl $1, [[REG0]] 162*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: testq %rdi, %rdi 163*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: js [[LABEL1:.LBB[0-9_]+]] 164*9880d681SAndroid Build Coastguard Worker 165*9880d681SAndroid Build Coastguard Worker; simple conversion to float if non-negative 166*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: cvtsi2ssq %rdi, [[REG1:%[a-z0-9]+]] 167*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvtsi2ssq %rdi, [[REG1:%[a-z0-9]+]], [[REG1]] 168*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: jmp [[LABEL2:.LBB[0-9_]+]] 169*9880d681SAndroid Build Coastguard Worker 170*9880d681SAndroid Build Coastguard Worker; convert using shift+or if negative 171*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: [[LABEL1]]: 172*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: shrq %rdi 173*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: orq %rdi, [[REG2:%[a-z0-9]+]] 174*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: cvtsi2ssq [[REG2]], [[REG3:%[a-z0-9]+]] 175*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: addss [[REG3]], [[REG1]] 176*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvtsi2ssq [[REG2]], [[REG3:%[a-z0-9]+]], [[REG3]] 177*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vaddss [[REG3]], [[REG3]], [[REG1:[%a-z0-9]+]] 178*9880d681SAndroid Build Coastguard Worker 179*9880d681SAndroid Build Coastguard Worker; convert float to half 180*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: [[LABEL2]]: 181*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: callq __gnu_f2h_ieee 182*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: movw %ax, ([[ADDR]]) 183*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: popq [[ADDR]] 184*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvtps2ph $4, [[REG1]], [[REG4:%[a-z0-9]+]] 185*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vmovd [[REG4]], %eax 186*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: movw %ax, (%rsi) 187*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: retq 188*9880d681SAndroid Build Coastguard Worker 189*9880d681SAndroid Build Coastguard Worker %r = uitofp i64 %a to half 190*9880d681SAndroid Build Coastguard Worker store half %r, half* %p 191*9880d681SAndroid Build Coastguard Worker ret void 192*9880d681SAndroid Build Coastguard Worker} 193*9880d681SAndroid Build Coastguard Worker 194*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_extend32_vec4(<4 x half>* %p) #0 { 195*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_extend32_vec4: 196*9880d681SAndroid Build Coastguard Worker 197*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: callq __gnu_h2f_ieee 198*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: callq __gnu_h2f_ieee 199*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: callq __gnu_h2f_ieee 200*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: callq __gnu_h2f_ieee 201*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtph2ps 202*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtph2ps 203*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtph2ps 204*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtph2ps 205*9880d681SAndroid Build Coastguard Worker %a = load <4 x half>, <4 x half>* %p, align 8 206*9880d681SAndroid Build Coastguard Worker %b = fpext <4 x half> %a to <4 x float> 207*9880d681SAndroid Build Coastguard Worker ret <4 x float> %b 208*9880d681SAndroid Build Coastguard Worker} 209*9880d681SAndroid Build Coastguard Worker 210*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_extend64_vec4(<4 x half>* %p) #0 { 211*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_extend64_vec4 212*9880d681SAndroid Build Coastguard Worker 213*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: callq __gnu_h2f_ieee 214*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-DAG: callq __gnu_h2f_ieee 215*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-DAG: callq __gnu_h2f_ieee 216*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-DAG: callq __gnu_h2f_ieee 217*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-DAG: cvtss2sd 218*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-DAG: cvtss2sd 219*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-DAG: cvtss2sd 220*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: cvtss2sd 221*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtph2ps 222*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-DAG: vcvtph2ps 223*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-DAG: vcvtph2ps 224*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-DAG: vcvtph2ps 225*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-DAG: vcvtss2sd 226*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-DAG: vcvtss2sd 227*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-DAG: vcvtss2sd 228*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtss2sd 229*9880d681SAndroid Build Coastguard Worker %a = load <4 x half>, <4 x half>* %p, align 8 230*9880d681SAndroid Build Coastguard Worker %b = fpext <4 x half> %a to <4 x double> 231*9880d681SAndroid Build Coastguard Worker ret <4 x double> %b 232*9880d681SAndroid Build Coastguard Worker} 233*9880d681SAndroid Build Coastguard Worker 234*9880d681SAndroid Build Coastguard Workerdefine void @test_trunc32_vec4(<4 x float> %a, <4 x half>* %p) { 235*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_trunc32_vec4: 236*9880d681SAndroid Build Coastguard Worker 237*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: callq __gnu_f2h_ieee 238*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: callq __gnu_f2h_ieee 239*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: callq __gnu_f2h_ieee 240*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL: callq __gnu_f2h_ieee 241*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtps2ph 242*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtps2ph 243*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtps2ph 244*9880d681SAndroid Build Coastguard Worker; CHECK-F16C: vcvtps2ph 245*9880d681SAndroid Build Coastguard Worker; CHECK: movw 246*9880d681SAndroid Build Coastguard Worker; CHECK: movw 247*9880d681SAndroid Build Coastguard Worker; CHECK: movw 248*9880d681SAndroid Build Coastguard Worker; CHECK: movw 249*9880d681SAndroid Build Coastguard Worker %v = fptrunc <4 x float> %a to <4 x half> 250*9880d681SAndroid Build Coastguard Worker store <4 x half> %v, <4 x half>* %p 251*9880d681SAndroid Build Coastguard Worker ret void 252*9880d681SAndroid Build Coastguard Worker} 253*9880d681SAndroid Build Coastguard Worker 254*9880d681SAndroid Build Coastguard Workerdefine void @test_trunc64_vec4(<4 x double> %a, <4 x half>* %p) { 255*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_trunc64_vec4: 256*9880d681SAndroid Build Coastguard Worker; CHECK: callq __truncdfhf2 257*9880d681SAndroid Build Coastguard Worker; CHECK: callq __truncdfhf2 258*9880d681SAndroid Build Coastguard Worker; CHECK: callq __truncdfhf2 259*9880d681SAndroid Build Coastguard Worker; CHECK: callq __truncdfhf2 260*9880d681SAndroid Build Coastguard Worker; CHECK: movw 261*9880d681SAndroid Build Coastguard Worker; CHECK: movw 262*9880d681SAndroid Build Coastguard Worker; CHECK: movw 263*9880d681SAndroid Build Coastguard Worker; CHECK: movw 264*9880d681SAndroid Build Coastguard Worker %v = fptrunc <4 x double> %a to <4 x half> 265*9880d681SAndroid Build Coastguard Worker store <4 x half> %v, <4 x half>* %p 266*9880d681SAndroid Build Coastguard Worker ret void 267*9880d681SAndroid Build Coastguard Worker} 268*9880d681SAndroid Build Coastguard Worker 269*9880d681SAndroid Build Coastguard Workerdeclare float @test_floatret(); 270*9880d681SAndroid Build Coastguard Worker 271*9880d681SAndroid Build Coastguard Worker; On i686, if SSE2 is available, the return value from test_floatret is loaded 272*9880d681SAndroid Build Coastguard Worker; to f80 and then rounded to f32. The DAG combiner should not combine this 273*9880d681SAndroid Build Coastguard Worker; fp_round and the subsequent fptrunc from float to half. 274*9880d681SAndroid Build Coastguard Workerdefine half @test_f80trunc_nodagcombine() #0 { 275*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_f80trunc_nodagcombine: 276*9880d681SAndroid Build Coastguard Worker; CHECK-I686-NOT: calll __truncxfhf2 277*9880d681SAndroid Build Coastguard Worker %1 = call float @test_floatret() 278*9880d681SAndroid Build Coastguard Worker %2 = fptrunc float %1 to half 279*9880d681SAndroid Build Coastguard Worker ret half %2 280*9880d681SAndroid Build Coastguard Worker} 281*9880d681SAndroid Build Coastguard Worker 282*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: test_sitofp_fadd_i32: 283*9880d681SAndroid Build Coastguard Worker 284*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: pushq %rbx 285*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: subq $16, %rsp 286*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: movl %edi, %ebx 287*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: movzwl (%rsi), %edi 288*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: callq __gnu_h2f_ieee 289*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: movss %xmm0, 12(%rsp) 290*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: cvtsi2ssl %ebx, %xmm0 291*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: callq __gnu_f2h_ieee 292*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: movzwl %ax, %edi 293*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: callq __gnu_h2f_ieee 294*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: addss 12(%rsp), %xmm0 295*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: addq $16, %rsp 296*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: popq %rbx 297*9880d681SAndroid Build Coastguard Worker; CHECK-LIBCALL-NEXT: retq 298*9880d681SAndroid Build Coastguard Worker 299*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: movswl (%rsi), %eax 300*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vmovd %eax, %xmm0 301*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvtph2ps %xmm0, %xmm0 302*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvtsi2ssl %edi, %xmm0, %xmm1 303*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvtps2ph $4, %xmm1, %xmm1 304*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vcvtph2ps %xmm1, %xmm1 305*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: vaddss %xmm1, %xmm0, %xmm0 306*9880d681SAndroid Build Coastguard Worker; CHECK-F16C-NEXT: retq 307*9880d681SAndroid Build Coastguard Worker 308*9880d681SAndroid Build Coastguard Workerdefine float @test_sitofp_fadd_i32(i32 %a, half* %b) #0 { 309*9880d681SAndroid Build Coastguard Worker %tmp0 = load half, half* %b 310*9880d681SAndroid Build Coastguard Worker %tmp1 = sitofp i32 %a to half 311*9880d681SAndroid Build Coastguard Worker %tmp2 = fadd half %tmp0, %tmp1 312*9880d681SAndroid Build Coastguard Worker %tmp3 = fpext half %tmp2 to float 313*9880d681SAndroid Build Coastguard Worker ret float %tmp3 314*9880d681SAndroid Build Coastguard Worker} 315*9880d681SAndroid Build Coastguard Worker 316*9880d681SAndroid Build Coastguard Workerattributes #0 = { nounwind } 317