; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-apple-darwin -mattr=+avx | FileCheck %s

; Code-generation tests for extracting a 128-bit half out of a 256-bit AVX
; vector, either through a shufflevector or through the
; llvm.x86.avx.vextractf128.* intrinsics, with and without a following store.

; Shuffle that moves elements 4-7 of %a into the low four lanes; the remaining
; mask indices (8) select from the undef second operand. The expected output is
; a single vextractf128 with immediate 1.
define <8 x float> @A(<8 x float> %a) nounwind uwtable readnone ssp {
; CHECK-LABEL: A:
; CHECK:       ## BB#0: ## %entry
; CHECK-NEXT:    vextractf128 $1, %ymm0, %xmm0
; CHECK-NEXT:    retq
entry:
  %shuffle = shufflevector <8 x float> %a, <8 x float> undef, <8 x i32> <i32 4, i32 5, i32 6, i32 7, i32 8, i32 8, i32 8, i32 8>
  ret <8 x float> %shuffle
}

; Same pattern as @A for <4 x double>: elements 2-3 move to the low lanes and
; the remaining mask indices (4) select from the undef second operand.
define <4 x double> @B(<4 x double> %a) nounwind uwtable readnone ssp {
; CHECK-LABEL: B:
; CHECK:       ## BB#0: ## %entry
; CHECK-NEXT:    vextractf128 $1, %ymm0, %xmm0
; CHECK-NEXT:    retq
entry:
  %shuffle = shufflevector <4 x double> %a, <4 x double> undef, <4 x i32> <i32 2, i32 3, i32 4, i32 4>
  ret <4 x double> %shuffle
}

; Intrinsic extract with immediate 1 (<8 x float> source) followed by a
; 16-byte-aligned store. The expected output is one vextractf128 whose
; destination is the memory operand.
define void @t0(float* nocapture %addr, <8 x float> %a) nounwind uwtable ssp {
; CHECK-LABEL: t0:
; CHECK:       ## BB#0: ## %entry
; CHECK-NEXT:    vextractf128 $1, %ymm0, (%rdi)
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
entry:
  %0 = tail call <4 x float> @llvm.x86.avx.vextractf128.ps.256(<8 x float> %a, i8 1)
  %1 = bitcast float* %addr to <4 x float>*
  store <4 x float> %0, <4 x float>* %1, align 16
  ret void
}

; <4 x double> variant of @t0 (immediate 1, 16-byte-aligned store).
define void @t2(double* nocapture %addr, <4 x double> %a) nounwind uwtable ssp {
; CHECK-LABEL: t2:
; CHECK:       ## BB#0: ## %entry
; CHECK-NEXT:    vextractf128 $1, %ymm0, (%rdi)
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
entry:
  %0 = tail call <2 x double> @llvm.x86.avx.vextractf128.pd.256(<4 x double> %a, i8 1)
  %1 = bitcast double* %addr to <2 x double>*
  store <2 x double> %0, <2 x double>* %1, align 16
  ret void
}

; Integer variant of @t0: the <4 x i64> argument is bitcast to <8 x i32> for
; the .si.256 intrinsic (immediate 1) and the result is bitcast back to
; <2 x i64> before the 16-byte-aligned store.
define void @t4(<2 x i64>* nocapture %addr, <4 x i64> %a) nounwind uwtable ssp {
; CHECK-LABEL: t4:
; CHECK:       ## BB#0: ## %entry
; CHECK-NEXT:    vextractf128 $1, %ymm0, (%rdi)
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
entry:
  %0 = bitcast <4 x i64> %a to <8 x i32>
  %1 = tail call <4 x i32> @llvm.x86.avx.vextractf128.si.256(<8 x i32> %0, i8 1)
  %2 = bitcast <4 x i32> %1 to <2 x i64>
  store <2 x i64> %2, <2 x i64>* %addr, align 16
  ret void
}

; Intrinsic extract with immediate 0 (<8 x float> source) followed by a
; 16-byte-aligned store. The expected output contains no vextractf128, only a
; vmovaps of %xmm0 to memory.
define void @t5(float* nocapture %addr, <8 x float> %a) nounwind uwtable ssp {
; CHECK-LABEL: t5:
; CHECK:       ## BB#0: ## %entry
; CHECK-NEXT:    vmovaps %xmm0, (%rdi)
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
entry:
  %0 = tail call <4 x float> @llvm.x86.avx.vextractf128.ps.256(<8 x float> %a, i8 0)
  %1 = bitcast float* %addr to <4 x float>*
  store <4 x float> %0, <4 x float>* %1, align 16
  ret void
}

; <4 x double> variant of @t5 (immediate 0, 16-byte-aligned store).
define void @t6(double* nocapture %addr, <4 x double> %a) nounwind uwtable ssp {
; CHECK-LABEL: t6:
; CHECK:       ## BB#0: ## %entry
; CHECK-NEXT:    vmovaps %xmm0, (%rdi)
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
entry:
  %0 = tail call <2 x double> @llvm.x86.avx.vextractf128.pd.256(<4 x double> %a, i8 0)
  %1 = bitcast double* %addr to <2 x double>*
  store <2 x double> %0, <2 x double>* %1, align 16
  ret void
}

; Integer variant of @t5 (immediate 0, 16-byte-aligned store), using the same
; bitcast sequence as @t4.
define void @t7(<2 x i64>* nocapture %addr, <4 x i64> %a) nounwind uwtable ssp {
; CHECK-LABEL: t7:
; CHECK:       ## BB#0: ## %entry
; CHECK-NEXT:    vmovaps %xmm0, (%rdi)
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
entry:
  %0 = bitcast <4 x i64> %a to <8 x i32>
  %1 = tail call <4 x i32> @llvm.x86.avx.vextractf128.si.256(<8 x i32> %0, i8 0)
  %2 = bitcast <4 x i32> %1 to <2 x i64>
  store <2 x i64> %2, <2 x i64>* %addr, align 16
  ret void
}

; Same IR as @t7 except that the store is only 1-byte aligned, so the expected
; store instruction is the unaligned vmovups instead of vmovaps.
define void @t8(<2 x i64>* nocapture %addr, <4 x i64> %a) nounwind uwtable ssp {
; CHECK-LABEL: t8:
; CHECK:       ## BB#0: ## %entry
; CHECK-NEXT:    vmovups %xmm0, (%rdi)
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
entry:
  %0 = bitcast <4 x i64> %a to <8 x i32>
  %1 = tail call <4 x i32> @llvm.x86.avx.vextractf128.si.256(<8 x i32> %0, i8 0)
  %2 = bitcast <4 x i32> %1 to <2 x i64>
  store <2 x i64> %2, <2 x i64>* %addr, align 1
  ret void
}

; PR15462
; Four i64 zero stores to consecutive elements %p[0..3]. The expected output
; is a zeroed %ymm0 written with a single 32-byte vmovups.
define void @t9(i64* %p) {
; CHECK-LABEL: t9:
; CHECK:       ## BB#0:
; CHECK-NEXT:    vxorps %ymm0, %ymm0, %ymm0
; CHECK-NEXT:    vmovups %ymm0, (%rdi)
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
  store i64 0, i64* %p
  %q = getelementptr i64, i64* %p, i64 1
  store i64 0, i64* %q
  %r = getelementptr i64, i64* %p, i64 2
  store i64 0, i64* %r
  %s = getelementptr i64, i64* %p, i64 3
  store i64 0, i64* %s
  ret void
}

; Intrinsics exercised above; the i8 operand is the immediate (0 or 1) passed
; at each call site.
declare <2 x double> @llvm.x86.avx.vextractf128.pd.256(<4 x double>, i8) nounwind readnone
declare <4 x float> @llvm.x86.avx.vextractf128.ps.256(<8 x float>, i8) nounwind readnone
declare <4 x i32> @llvm.x86.avx.vextractf128.si.256(<8 x i32>, i8) nounwind readnone