; RUN: llc < %s -march=x86 -mattr=+mmx,+sse2 | FileCheck -check-prefix=X32 %s
; RUN: llc < %s -march=x86-64 -mattr=+mmx,+sse2 | FileCheck -check-prefix=X64 %s

;; A basic sanity check to make sure that MMX arithmetic actually compiles.
;; First is a straight translation of the original with bitcasts as needed.

;; test0: byte lanes (<8 x i8>). Each step reloads %B, combines it with the
;; running value and stores the result back to %A. Generic IR operations are
;; done on <8 x i8> via bitcasts; the saturating forms go through the MMX
;; intrinsics directly on x86_mmx values.
; X32-LABEL: test0
; X64-LABEL: test0
define void @test0(x86_mmx* %A, x86_mmx* %B) {
entry:
  ;; add
  %tmp1 = load x86_mmx, x86_mmx* %A
  %tmp3 = load x86_mmx, x86_mmx* %B
  %tmp1a = bitcast x86_mmx %tmp1 to <8 x i8>
  %tmp3a = bitcast x86_mmx %tmp3 to <8 x i8>
  %tmp4 = add <8 x i8> %tmp1a, %tmp3a
  %tmp4a = bitcast <8 x i8> %tmp4 to x86_mmx
  store x86_mmx %tmp4a, x86_mmx* %A
  ;; padds.b intrinsic
  %tmp7 = load x86_mmx, x86_mmx* %B
  %tmp12 = tail call x86_mmx @llvm.x86.mmx.padds.b(x86_mmx %tmp4a, x86_mmx %tmp7)
  store x86_mmx %tmp12, x86_mmx* %A
  ;; paddus.b intrinsic
  %tmp16 = load x86_mmx, x86_mmx* %B
  %tmp21 = tail call x86_mmx @llvm.x86.mmx.paddus.b(x86_mmx %tmp12, x86_mmx %tmp16)
  store x86_mmx %tmp21, x86_mmx* %A
  ;; sub
  %tmp27 = load x86_mmx, x86_mmx* %B
  %tmp21a = bitcast x86_mmx %tmp21 to <8 x i8>
  %tmp27a = bitcast x86_mmx %tmp27 to <8 x i8>
  %tmp28 = sub <8 x i8> %tmp21a, %tmp27a
  %tmp28a = bitcast <8 x i8> %tmp28 to x86_mmx
  store x86_mmx %tmp28a, x86_mmx* %A
  ;; psubs.b intrinsic
  %tmp31 = load x86_mmx, x86_mmx* %B
  %tmp36 = tail call x86_mmx @llvm.x86.mmx.psubs.b(x86_mmx %tmp28a, x86_mmx %tmp31)
  store x86_mmx %tmp36, x86_mmx* %A
  ;; psubus.b intrinsic
  %tmp40 = load x86_mmx, x86_mmx* %B
  %tmp45 = tail call x86_mmx @llvm.x86.mmx.psubus.b(x86_mmx %tmp36, x86_mmx %tmp40)
  store x86_mmx %tmp45, x86_mmx* %A
  ;; mul
  %tmp51 = load x86_mmx, x86_mmx* %B
  %tmp45a = bitcast x86_mmx %tmp45 to <8 x i8>
  %tmp51a = bitcast x86_mmx %tmp51 to <8 x i8>
  %tmp52 = mul <8 x i8> %tmp45a, %tmp51a
  %tmp52a = bitcast <8 x i8> %tmp52 to x86_mmx
  store x86_mmx %tmp52a, x86_mmx* %A
  ;; and
  %tmp57 = load x86_mmx, x86_mmx* %B
  %tmp57a = bitcast x86_mmx %tmp57 to <8 x i8>
  %tmp58 = and <8 x i8> %tmp52, %tmp57a
  %tmp58a = bitcast <8 x i8> %tmp58 to x86_mmx
  store x86_mmx %tmp58a, x86_mmx* %A
  ;; or
  %tmp63 = load x86_mmx, x86_mmx* %B
  %tmp63a = bitcast x86_mmx %tmp63 to <8 x i8>
  %tmp64 = or <8 x i8> %tmp58, %tmp63a
  %tmp64a = bitcast <8 x i8> %tmp64 to x86_mmx
  store x86_mmx %tmp64a, x86_mmx* %A
  ;; xor
  %tmp69 = load x86_mmx, x86_mmx* %B
  %tmp69a = bitcast x86_mmx %tmp69 to <8 x i8>
  %tmp64b = bitcast x86_mmx %tmp64a to <8 x i8>
  %tmp70 = xor <8 x i8> %tmp64b, %tmp69a
  %tmp70a = bitcast <8 x i8> %tmp70 to x86_mmx
  store x86_mmx %tmp70a, x86_mmx* %A
  tail call void @llvm.x86.mmx.emms()
  ret void
}

;; test1: the same load/combine/store chain on doubleword lanes (<2 x i32>),
;; using only generic IR operations: add, sub, mul, and, or, xor.
; X32-LABEL: test1
; X64-LABEL: test1
define void @test1(x86_mmx* %A, x86_mmx* %B) {
entry:
  ;; add
  %tmp1 = load x86_mmx, x86_mmx* %A
  %tmp3 = load x86_mmx, x86_mmx* %B
  %tmp1a = bitcast x86_mmx %tmp1 to <2 x i32>
  %tmp3a = bitcast x86_mmx %tmp3 to <2 x i32>
  %tmp4 = add <2 x i32> %tmp1a, %tmp3a
  %tmp4a = bitcast <2 x i32> %tmp4 to x86_mmx
  store x86_mmx %tmp4a, x86_mmx* %A
  ;; sub
  %tmp9 = load x86_mmx, x86_mmx* %B
  %tmp9a = bitcast x86_mmx %tmp9 to <2 x i32>
  %tmp10 = sub <2 x i32> %tmp4, %tmp9a
  ;; Cast the subtraction result itself. Casting %tmp4 here would leave
  ;; %tmp10 without any use, so the subtract would never be stored or fed
  ;; into the multiply below.
  %tmp10a = bitcast <2 x i32> %tmp10 to x86_mmx
  store x86_mmx %tmp10a, x86_mmx* %A
  ;; mul
  %tmp15 = load x86_mmx, x86_mmx* %B
  %tmp10b = bitcast x86_mmx %tmp10a to <2 x i32>
  %tmp15a = bitcast x86_mmx %tmp15 to <2 x i32>
  %tmp16 = mul <2 x i32> %tmp10b, %tmp15a
  %tmp16a = bitcast <2 x i32> %tmp16 to x86_mmx
  store x86_mmx %tmp16a, x86_mmx* %A
  ;; and
  %tmp21 = load x86_mmx, x86_mmx* %B
  %tmp16b = bitcast x86_mmx %tmp16a to <2 x i32>
  %tmp21a = bitcast x86_mmx %tmp21 to <2 x i32>
  %tmp22 = and <2 x i32> %tmp16b, %tmp21a
  %tmp22a = bitcast <2 x i32> %tmp22 to x86_mmx
  store x86_mmx %tmp22a, x86_mmx* %A
  ;; or
  %tmp27 = load x86_mmx, x86_mmx* %B
  %tmp22b = bitcast x86_mmx %tmp22a to <2 x i32>
  %tmp27a = bitcast x86_mmx %tmp27 to <2 x i32>
  %tmp28 = or <2 x i32> %tmp22b, %tmp27a
  %tmp28a = bitcast <2 x i32> %tmp28 to x86_mmx
  store x86_mmx %tmp28a, x86_mmx* %A
  ;; xor
  %tmp33 = load x86_mmx, x86_mmx* %B
  %tmp28b = bitcast x86_mmx %tmp28a to <2 x i32>
  %tmp33a = bitcast x86_mmx %tmp33 to <2 x i32>
  %tmp34 = xor <2 x i32> %tmp28b, %tmp33a
  %tmp34a = bitcast <2 x i32> %tmp34 to x86_mmx
  store x86_mmx %tmp34a, x86_mmx* %A
  tail call void @llvm.x86.mmx.emms()
  ret void
}

;; test2: word lanes (<4 x i16>). Same chain as test0, plus the pmulh.w and
;; pmadd.wd intrinsics after the generic multiply.
; X32-LABEL: test2
; X64-LABEL: test2
define void @test2(x86_mmx* %A, x86_mmx* %B) {
entry:
  ;; add
  %tmp1 = load x86_mmx, x86_mmx* %A
  %tmp3 = load x86_mmx, x86_mmx* %B
  %tmp1a = bitcast x86_mmx %tmp1 to <4 x i16>
  %tmp3a = bitcast x86_mmx %tmp3 to <4 x i16>
  %tmp4 = add <4 x i16> %tmp1a, %tmp3a
  %tmp4a = bitcast <4 x i16> %tmp4 to x86_mmx
  store x86_mmx %tmp4a, x86_mmx* %A
  ;; padds.w intrinsic
  %tmp7 = load x86_mmx, x86_mmx* %B
  %tmp12 = tail call x86_mmx @llvm.x86.mmx.padds.w(x86_mmx %tmp4a, x86_mmx %tmp7)
  store x86_mmx %tmp12, x86_mmx* %A
  ;; paddus.w intrinsic
  %tmp16 = load x86_mmx, x86_mmx* %B
  %tmp21 = tail call x86_mmx @llvm.x86.mmx.paddus.w(x86_mmx %tmp12, x86_mmx %tmp16)
  store x86_mmx %tmp21, x86_mmx* %A
  ;; sub
  %tmp27 = load x86_mmx, x86_mmx* %B
  %tmp21a = bitcast x86_mmx %tmp21 to <4 x i16>
  %tmp27a = bitcast x86_mmx %tmp27 to <4 x i16>
  %tmp28 = sub <4 x i16> %tmp21a, %tmp27a
  %tmp28a = bitcast <4 x i16> %tmp28 to x86_mmx
  store x86_mmx %tmp28a, x86_mmx* %A
  ;; psubs.w intrinsic
  %tmp31 = load x86_mmx, x86_mmx* %B
  %tmp36 = tail call x86_mmx @llvm.x86.mmx.psubs.w(x86_mmx %tmp28a, x86_mmx %tmp31)
  store x86_mmx %tmp36, x86_mmx* %A
  ;; psubus.w intrinsic
  %tmp40 = load x86_mmx, x86_mmx* %B
  %tmp45 = tail call x86_mmx @llvm.x86.mmx.psubus.w(x86_mmx %tmp36, x86_mmx %tmp40)
  store x86_mmx %tmp45, x86_mmx* %A
  ;; mul
  %tmp51 = load x86_mmx, x86_mmx* %B
  %tmp45a = bitcast x86_mmx %tmp45 to <4 x i16>
  %tmp51a = bitcast x86_mmx %tmp51 to <4 x i16>
  %tmp52 = mul <4 x i16> %tmp45a, %tmp51a
  %tmp52a = bitcast <4 x i16> %tmp52 to x86_mmx
  store x86_mmx %tmp52a, x86_mmx* %A
  ;; pmulh.w intrinsic
  %tmp55 = load x86_mmx, x86_mmx* %B
  %tmp60 = tail call x86_mmx @llvm.x86.mmx.pmulh.w(x86_mmx %tmp52a, x86_mmx %tmp55)
  store x86_mmx %tmp60, x86_mmx* %A
  ;; pmadd.wd intrinsic; the x86_mmx-to-x86_mmx bitcast that follows is a
  ;; same-type cast kept from the original translation.
  %tmp64 = load x86_mmx, x86_mmx* %B
  %tmp69 = tail call x86_mmx @llvm.x86.mmx.pmadd.wd(x86_mmx %tmp60, x86_mmx %tmp64)
  %tmp70 = bitcast x86_mmx %tmp69 to x86_mmx
  store x86_mmx %tmp70, x86_mmx* %A
  ;; and
  %tmp75 = load x86_mmx, x86_mmx* %B
  %tmp70a = bitcast x86_mmx %tmp70 to <4 x i16>
  %tmp75a = bitcast x86_mmx %tmp75 to <4 x i16>
  %tmp76 = and <4 x i16> %tmp70a, %tmp75a
  %tmp76a = bitcast <4 x i16> %tmp76 to x86_mmx
  store x86_mmx %tmp76a, x86_mmx* %A
  ;; or
  %tmp81 = load x86_mmx, x86_mmx* %B
  %tmp76b = bitcast x86_mmx %tmp76a to <4 x i16>
  %tmp81a = bitcast x86_mmx %tmp81 to <4 x i16>
  %tmp82 = or <4 x i16> %tmp76b, %tmp81a
  %tmp82a = bitcast <4 x i16> %tmp82 to x86_mmx
  store x86_mmx %tmp82a, x86_mmx* %A
  ;; xor
  %tmp87 = load x86_mmx, x86_mmx* %B
  %tmp82b = bitcast x86_mmx %tmp82a to <4 x i16>
  %tmp87a = bitcast x86_mmx %tmp87 to <4 x i16>
  %tmp88 = xor <4 x i16> %tmp82b, %tmp87a
  %tmp88a = bitcast <4 x i16> %tmp88 to x86_mmx
  store x86_mmx %tmp88a, x86_mmx* %A
  tail call void @llvm.x86.mmx.emms()
  ret void
}

;; test3: loop that accumulates a[i] + b[i] as <1 x i64> for i in [0, count).
;; Returns zeroinitializer when %count is 0. Only the 32-bit run is checked;
;; it expects an addl/adcl pair in the loop body.
; X32-LABEL: test3
define <1 x i64> @test3(<1 x i64>* %a, <1 x i64>* %b, i32 %count) nounwind {
entry:
  %tmp2942 = icmp eq i32 %count, 0
  br i1 %tmp2942, label %bb31, label %bb26

bb26:
; X32:  addl
; X32:  adcl
  %i.037.0 = phi i32 [ 0, %entry ], [ %tmp25, %bb26 ]
  %sum.035.0 = phi <1 x i64> [ zeroinitializer, %entry ], [ %tmp22, %bb26 ]
  %tmp13 = getelementptr <1 x i64>, <1 x i64>* %b, i32 %i.037.0
  %tmp14 = load <1 x i64>, <1 x i64>* %tmp13
  %tmp18 = getelementptr <1 x i64>, <1 x i64>* %a, i32 %i.037.0
  %tmp19 = load <1 x i64>, <1 x i64>* %tmp18
  %tmp21 = add <1 x i64> %tmp19, %tmp14
  %tmp22 = add <1 x i64> %tmp21, %sum.035.0
  %tmp25 = add i32 %i.037.0, 1
  %tmp29 = icmp ult i32 %tmp25, %count
  br i1 %tmp29, label %bb26, label %bb31

bb31:
  %sum.035.1 = phi <1 x i64> [ zeroinitializer, %entry ], [ %tmp22, %bb26 ]
  ret <1 x i64> %sum.035.1
}

; There are no MMX operations here, so we use XMM or i64.
;; Each function below bitcasts its two double arguments to a 64-bit vector
;; type, adds them with a generic IR add, and stores the result to null.
; X64-LABEL: ti8
define void @ti8(double %a, double %b) nounwind {
entry:
  %tmp1 = bitcast double %a to <8 x i8>
  %tmp2 = bitcast double %b to <8 x i8>
  %tmp3 = add <8 x i8> %tmp1, %tmp2
; X64:  paddb
  store <8 x i8> %tmp3, <8 x i8>* null
  ret void
}

; X64-LABEL: ti16
define void @ti16(double %a, double %b) nounwind {
entry:
  %tmp1 = bitcast double %a to <4 x i16>
  %tmp2 = bitcast double %b to <4 x i16>
  %tmp3 = add <4 x i16> %tmp1, %tmp2
; X64:  paddw
  store <4 x i16> %tmp3, <4 x i16>* null
  ret void
}

; X64-LABEL: ti32
define void @ti32(double %a, double %b) nounwind {
entry:
  %tmp1 = bitcast double %a to <2 x i32>
  %tmp2 = bitcast double %b to <2 x i32>
  %tmp3 = add <2 x i32> %tmp1, %tmp2
; X64:  paddd
  store <2 x i32> %tmp3, <2 x i32>* null
  ret void
}

; X64-LABEL: ti64
define void @ti64(double %a, double %b) nounwind {
entry:
  %tmp1 = bitcast double %a to <1 x i64>
  %tmp2 = bitcast double %b to <1 x i64>
  %tmp3 = add <1 x i64> %tmp1, %tmp2
; X64:  addq
  store <1 x i64> %tmp3, <1 x i64>* null
  ret void
}

; MMX intrinsics calls get us MMX instructions.
;; Each function below bitcasts its two double arguments to x86_mmx and adds
;; them through an MMX padd intrinsic, storing the result to null. The 64-bit
;; run expects one movdq2q per bitcast, followed by the MMX add that matches
;; the intrinsic.
; X64-LABEL: ti8a
define void @ti8a(double %a, double %b) nounwind {
entry:
  %tmp1 = bitcast double %a to x86_mmx
; X64: movdq2q
  %tmp2 = bitcast double %b to x86_mmx
; X64: movdq2q
  %tmp3 = tail call x86_mmx @llvm.x86.mmx.padd.b(x86_mmx %tmp1, x86_mmx %tmp2)
; X64: paddb
  store x86_mmx %tmp3, x86_mmx* null
  ret void
}

; X64-LABEL: ti16a
define void @ti16a(double %a, double %b) nounwind {
entry:
  %tmp1 = bitcast double %a to x86_mmx
; X64: movdq2q
  %tmp2 = bitcast double %b to x86_mmx
; X64: movdq2q
  %tmp3 = tail call x86_mmx @llvm.x86.mmx.padd.w(x86_mmx %tmp1, x86_mmx %tmp2)
; X64: paddw
  store x86_mmx %tmp3, x86_mmx* null
  ret void
}

; X64-LABEL: ti32a
define void @ti32a(double %a, double %b) nounwind {
entry:
  %tmp1 = bitcast double %a to x86_mmx
; X64: movdq2q
  %tmp2 = bitcast double %b to x86_mmx
; X64: movdq2q
  %tmp3 = tail call x86_mmx @llvm.x86.mmx.padd.d(x86_mmx %tmp1, x86_mmx %tmp2)
; X64: paddd
  store x86_mmx %tmp3, x86_mmx* null
  ret void
}

; X64-LABEL: ti64a
define void @ti64a(double %a, double %b) nounwind {
entry:
  %tmp1 = bitcast double %a to x86_mmx
; X64: movdq2q
  %tmp2 = bitcast double %b to x86_mmx
; X64: movdq2q
  %tmp3 = tail call x86_mmx @llvm.x86.mmx.padd.q(x86_mmx %tmp1, x86_mmx %tmp2)
; X64: paddq
  store x86_mmx %tmp3, x86_mmx* null
  ret void
}

;; Declarations of the MMX intrinsics called in this file.

;; Plain (wrapping) adds.
declare x86_mmx @llvm.x86.mmx.padd.b(x86_mmx, x86_mmx)
declare x86_mmx @llvm.x86.mmx.padd.w(x86_mmx, x86_mmx)
declare x86_mmx @llvm.x86.mmx.padd.d(x86_mmx, x86_mmx)
declare x86_mmx @llvm.x86.mmx.padd.q(x86_mmx, x86_mmx)

;; paddus/psubus forms, plus the word multiplies.
declare x86_mmx @llvm.x86.mmx.paddus.b(x86_mmx, x86_mmx)
declare x86_mmx @llvm.x86.mmx.psubus.b(x86_mmx, x86_mmx)
declare x86_mmx @llvm.x86.mmx.paddus.w(x86_mmx, x86_mmx)
declare x86_mmx @llvm.x86.mmx.psubus.w(x86_mmx, x86_mmx)
declare x86_mmx @llvm.x86.mmx.pmulh.w(x86_mmx, x86_mmx)
declare x86_mmx @llvm.x86.mmx.pmadd.wd(x86_mmx, x86_mmx)

declare void @llvm.x86.mmx.emms()

;; padds/psubs forms.
declare x86_mmx @llvm.x86.mmx.padds.b(x86_mmx, x86_mmx)
declare x86_mmx @llvm.x86.mmx.padds.w(x86_mmx, x86_mmx)
declare x86_mmx @llvm.x86.mmx.psubs.b(x86_mmx, x86_mmx)
declare x86_mmx @llvm.x86.mmx.psubs.w(x86_mmx, x86_mmx)