; RUN: llc -mtriple=x86_64-apple-macosx -mattr=+sse2 -verify-machineinstrs < %s | FileCheck %s

; After tail duplication, two copies in an early exit BB can be cancelled out.
; rdar://10640363
;
; @t1 is a remainder loop over i32 values: each iteration computes
; srem(%a.addr.03, %b.addr.02) and exits once the remainder is zero. When %b is
; zero on entry, control goes straight to %while.end and %a is returned.
; The directives below capture the target label of the first `je` and require
; that no `mov` appears between that label and the following `ret`.
define i32 @t1(i32 %a, i32 %b) nounwind {
entry:
; CHECK-LABEL: t1:
; CHECK: je [[LABEL:.*BB.*]]
  %cmp1 = icmp eq i32 %b, 0
  br i1 %cmp1, label %while.end, label %while.body

; CHECK: [[LABEL]]:
; CHECK-NOT: mov
; CHECK: ret

while.body:                                       ; preds = %entry, %while.body
  ; The two phis rotate the operands: the previous divisor becomes the
  ; dividend and the previous remainder becomes the divisor.
  %a.addr.03 = phi i32 [ %b.addr.02, %while.body ], [ %a, %entry ]
  %b.addr.02 = phi i32 [ %rem, %while.body ], [ %b, %entry ]
  %rem = srem i32 %a.addr.03, %b.addr.02
  %cmp = icmp eq i32 %rem, 0
  br i1 %cmp, label %while.end, label %while.body

while.end:                                        ; preds = %while.body, %entry
  ; Result is %a on the early exit, otherwise the last divisor from the loop.
  %a.addr.0.lcssa = phi i32 [ %a, %entry ], [ %b.addr.02, %while.body ]
  ret i32 %a.addr.0.lcssa
}

; Two movdqa (from phi-elimination) in the entry BB cancel out.
; rdar://10428165
;
; @t2 is a single shufflevector of two <8 x i16> inputs. The directive below
; requires that no `movdqa` is emitted in the code generated for this function.
define <8 x i16> @t2(<8 x i16> %T0, <8 x i16> %T1) nounwind readnone {
entry:
; CHECK-LABEL: t2:
; CHECK-NOT: movdqa
  %tmp8 = shufflevector <8 x i16> %T0, <8 x i16> %T1, <8 x i32> < i32 undef, i32 undef, i32 7, i32 2, i32 8, i32 undef, i32 undef , i32 undef >
  ret <8 x i16> %tmp8
}

; @t3 has the same shape as @t1 but operates on i64 values and truncates the
; result to i32 before returning. As in @t1, no `mov` may appear between the
; label targeted by the first `je` and the following `ret`.
define i32 @t3(i64 %a, i64 %b) nounwind {
entry:
; CHECK-LABEL: t3:
; CHECK: je [[LABEL:.*BB.*]]
  %cmp1 = icmp eq i64 %b, 0
  br i1 %cmp1, label %while.end, label %while.body

; CHECK: [[LABEL]]:
; CHECK-NOT: mov
; CHECK: ret

while.body:                                       ; preds = %entry, %while.body
  ; The two phis rotate the operands: the previous divisor becomes the
  ; dividend and the previous remainder becomes the divisor.
  %a.addr.03 = phi i64 [ %b.addr.02, %while.body ], [ %a, %entry ]
  %b.addr.02 = phi i64 [ %rem, %while.body ], [ %b, %entry ]
  %rem = srem i64 %a.addr.03, %b.addr.02
  %cmp = icmp eq i64 %rem, 0
  br i1 %cmp, label %while.end, label %while.body

while.end:                                        ; preds = %while.body, %entry
  ; Result is %a on the early exit, otherwise the last divisor from the loop.
  %a.addr.0.lcssa = phi i64 [ %a, %entry ], [ %b.addr.02, %while.body ]
  %t = trunc i64 %a.addr.0.lcssa to i32
  ret i32 %t
}

; Check that copy propagation does not kill things like:
; dst = copy src         <-- do not kill that.
; ... = op1 dst<undef>
; ... = op2 dst          <-- this is used here.
;
; In the sequence below, CPY1 is bound to the destination register of the
; movdqa copy and CPY2 to the destination of the punpckhbw. For each of them
; the directives require that nothing else writes the register (no other
; instruction with it as the last operand) before the punpckhwd that uses it.
;
; CHECK-LABEL: foo:
; CHECK: psllw $7,
; CHECK: psllw $7, [[SRC1:%xmm[0-9]+]]
; CHECK-NEXT: pand {{.*}}(%rip), [[SRC1]]
; CHECK-NEXT: pcmpgtb [[SRC1]], [[SRC2:%xmm[0-9]+]]
; CHECK-NEXT: pand %xmm{{[0-9]+}}, [[SRC2]]
; CHECK-NEXT: movdqa [[SRC2]], [[CPY1:%xmm[0-9]+]]
; CHECK-NEXT: punpcklbw %xmm{{[0-9]+}}, [[CPY1]]
; Check that CPY1 is not redefined.
; CHECK-NOT: , [[CPY1]]
; CHECK: punpckhwd %xmm{{[0-9]+}}, [[CPY1]]
; CHECK-NEXT: pslld $31, [[CPY1]]
; CHECK-NEXT: psrad $31, [[CPY1]]
; CHECK: punpckhbw %xmm{{[0-9]+}}, [[CPY2:%xmm[0-9]+]]
; Check that CPY2 is not redefined.
; CHECK-NOT: , [[CPY2]]
; CHECK: punpckhwd %xmm{{[0-9]+}}, [[CPY2]]
; CHECK-NEXT: pslld $31, [[CPY2]]
; CHECK-NEXT: psrad $31, [[CPY2]]
define <16 x float> @foo(<16 x float> %x) {
bb:
  %v3 = icmp slt <16 x i32> undef, zeroinitializer
  %v14 = zext <16 x i1> %v3 to <16 x i32>
  %v16 = fcmp olt <16 x float> %x, zeroinitializer
  %v17 = sext <16 x i1> %v16 to <16 x i32>
  %v18 = zext <16 x i1> %v16 to <16 x i32>
  %v19 = xor <16 x i32> %v14, %v18
  %v20 = or <16 x i32> %v17, undef
  %v21 = fptosi <16 x float> %x to <16 x i32>
  %v22 = sitofp <16 x i32> %v21 to <16 x float>
  %v69 = fcmp ogt <16 x float> %v22, zeroinitializer
  %v75 = and <16 x i1> %v69, %v3
  %v77 = bitcast <16 x float> %v22 to <16 x i32>
  %v79 = sext <16 x i1> %v75 to <16 x i32>
  %v80 = and <16 x i32> undef, %v79
  %v81 = xor <16 x i32> %v77, %v80
  %v82 = and <16 x i32> undef, %v81
  %v83 = xor <16 x i32> %v19, %v82
  %v84 = and <16 x i32> %v83, %v20
  %v85 = xor <16 x i32> %v19, %v84
  %v86 = bitcast <16 x i32> %v85 to <16 x float>
  ret <16 x float> %v86
}