; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-unknown-unknown | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE3
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+ssse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSSE3
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx | FileCheck %s --check-prefix=ALL --check-prefix=AVX --check-prefix=AVX1
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx2 | FileCheck %s --check-prefix=ALL --check-prefix=AVX --check-prefix=AVX2
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx512cd,+avx512vl | FileCheck %s --check-prefix=ALL --check-prefix=AVX --check-prefix=AVX512CDVL
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx512cd,-avx512vl | FileCheck %s --check-prefix=ALL --check-prefix=AVX --check-prefix=AVX512CD
;
; Just one 32-bit run to make sure we do reasonable things for i64 tzcnt.
; RUN: llc < %s -mtriple=i686-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=X32-SSE --check-prefix=X32-SSE41

; Count trailing zeros of each lane of a <2 x i64> vector, calling the
; intrinsic with its second operand set to i1 0. The expected code shows the
; consequence of that flag value - every bsf result is patched with the element
; width when the source was zero (movl $64 + cmoveq on x86-64, movl $32 /
; addl $32 / cmovel across the two 32-bit halves on i686).
; The check lines below are autogenerated; regenerate them with
; utils/update_llc_test_checks.py instead of editing them by hand.
define <2 x i64> @testv2i64(<2 x i64> %in) nounwind {
; SSE2-LABEL: testv2i64:
; SSE2:       # BB#0:
; SSE2-NEXT:    movd %xmm0, %rax
; SSE2-NEXT:    bsfq %rax, %rax
; SSE2-NEXT:    movl $64, %ecx
; SSE2-NEXT:    cmoveq %rcx, %rax
; SSE2-NEXT:    movd %rax, %xmm1
; SSE2-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
; SSE2-NEXT:    movd %xmm0, %rax
; SSE2-NEXT:    bsfq %rax, %rax
; SSE2-NEXT:    cmoveq %rcx, %rax
; SSE2-NEXT:    movd %rax, %xmm0
; SSE2-NEXT:    punpcklqdq {{.*#+}} xmm1 = xmm1[0],xmm0[0]
; SSE2-NEXT:    movdqa %xmm1, %xmm0
; SSE2-NEXT:    retq
;
; SSE3-LABEL: testv2i64:
; SSE3:       # BB#0:
; SSE3-NEXT:    movd %xmm0, %rax
; SSE3-NEXT:    bsfq %rax, %rax
; SSE3-NEXT:    movl $64, %ecx
; SSE3-NEXT:    cmoveq %rcx, %rax
; SSE3-NEXT:    movd %rax, %xmm1
; SSE3-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
; SSE3-NEXT:    movd %xmm0, %rax
; SSE3-NEXT:    bsfq %rax, %rax
; SSE3-NEXT:    cmoveq %rcx, %rax
; SSE3-NEXT:    movd %rax, %xmm0
; SSE3-NEXT:    punpcklqdq {{.*#+}} xmm1 = xmm1[0],xmm0[0]
; SSE3-NEXT:    movdqa %xmm1, %xmm0
; SSE3-NEXT:    retq
;
; SSSE3-LABEL: testv2i64:
; SSSE3:       # BB#0:
; SSSE3-NEXT:    movd %xmm0, %rax
; SSSE3-NEXT:    bsfq %rax, %rax
; SSSE3-NEXT:    movl $64, %ecx
; SSSE3-NEXT:    cmoveq %rcx, %rax
; SSSE3-NEXT:    movd %rax, %xmm1
; SSSE3-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
; SSSE3-NEXT:    movd %xmm0, %rax
; SSSE3-NEXT:    bsfq %rax, %rax
; SSSE3-NEXT:    cmoveq %rcx, %rax
; SSSE3-NEXT:    movd %rax, %xmm0
; SSSE3-NEXT:    punpcklqdq {{.*#+}} xmm1 = xmm1[0],xmm0[0]
; SSSE3-NEXT:    movdqa %xmm1, %xmm0
; SSSE3-NEXT:    retq
;
; SSE41-LABEL: testv2i64:
; SSE41:       # BB#0:
; SSE41-NEXT:    pextrq $1, %xmm0, %rax
; SSE41-NEXT:    bsfq %rax, %rax
; SSE41-NEXT:    movl $64, %ecx
; SSE41-NEXT:    cmoveq %rcx, %rax
; SSE41-NEXT:    movd %rax, %xmm1
; SSE41-NEXT:    movd %xmm0, %rax
; SSE41-NEXT:    bsfq %rax, %rax
; SSE41-NEXT:    cmoveq %rcx, %rax
; SSE41-NEXT:    movd %rax, %xmm0
; SSE41-NEXT:    punpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; SSE41-NEXT:    retq
;
; AVX-LABEL: testv2i64:
; AVX:       # BB#0:
; AVX-NEXT:    vpextrq $1, %xmm0, %rax
; AVX-NEXT:    bsfq %rax, %rax
; AVX-NEXT:    movl $64, %ecx
; AVX-NEXT:    cmoveq %rcx, %rax
; AVX-NEXT:    vmovq %rax, %xmm1
; AVX-NEXT:    vmovq %xmm0, %rax
; AVX-NEXT:    bsfq %rax, %rax
; AVX-NEXT:    cmoveq %rcx, %rax
; AVX-NEXT:    vmovq %rax, %xmm0
; AVX-NEXT:    vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; AVX-NEXT:    retq
;
; X32-SSE-LABEL: testv2i64:
; X32-SSE:       # BB#0:
; X32-SSE-NEXT:    pushl %esi
; X32-SSE-NEXT:    pextrd $3, %xmm0, %eax
; X32-SSE-NEXT:    bsfl %eax, %eax
; X32-SSE-NEXT:    movl $32, %ecx
; X32-SSE-NEXT:    cmovel %ecx, %eax
; X32-SSE-NEXT:    addl $32, %eax
; X32-SSE-NEXT:    pextrd $2, %xmm0, %edx
; X32-SSE-NEXT:    bsfl %edx, %esi
; X32-SSE-NEXT:    testl %edx, %edx
; X32-SSE-NEXT:    cmovel %eax, %esi
; X32-SSE-NEXT:    movd %esi, %xmm1
; X32-SSE-NEXT:    pextrd $1, %xmm0, %eax
; X32-SSE-NEXT:    bsfl %eax, %eax
; X32-SSE-NEXT:    cmovel %ecx, %eax
; X32-SSE-NEXT:    addl $32, %eax
; X32-SSE-NEXT:    movd %xmm0, %ecx
; X32-SSE-NEXT:    bsfl %ecx, %edx
; X32-SSE-NEXT:    testl %ecx, %ecx
; X32-SSE-NEXT:    cmovel %eax, %edx
; X32-SSE-NEXT:    movd %edx, %xmm0
; X32-SSE-NEXT:    punpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; X32-SSE-NEXT:    popl %esi
; X32-SSE-NEXT:    retl
  %out = call <2 x i64> @llvm.cttz.v2i64(<2 x i64> %in, i1 0)
  ret <2 x i64> %out
}

; Count trailing zeros of each lane of a <2 x i64> vector, calling the
; intrinsic with its second operand set to i1 -1 (the all-ones i1, i.e. true).
; Compared with testv2i64 the expected scalar sequences carry no cmov fix-up
; after bsf, and both AVX512CD runs expect a vector lowering instead -
; vplzcntq applied to (x & -x), with the result subtracted from a [63,63]
; constant.
; The check lines below are autogenerated; regenerate them with
; utils/update_llc_test_checks.py instead of editing them by hand.
define <2 x i64> @testv2i64u(<2 x i64> %in) nounwind {
; SSE2-LABEL: testv2i64u:
; SSE2:       # BB#0:
; SSE2-NEXT:    movd %xmm0, %rax
; SSE2-NEXT:    bsfq %rax, %rax
; SSE2-NEXT:    movd %rax, %xmm1
; SSE2-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
; SSE2-NEXT:    movd %xmm0, %rax
; SSE2-NEXT:    bsfq %rax, %rax
; SSE2-NEXT:    movd %rax, %xmm0
; SSE2-NEXT:    punpcklqdq {{.*#+}} xmm1 = xmm1[0],xmm0[0]
; SSE2-NEXT:    movdqa %xmm1, %xmm0
; SSE2-NEXT:    retq
;
; SSE3-LABEL: testv2i64u:
; SSE3:       # BB#0:
; SSE3-NEXT:    movd %xmm0, %rax
; SSE3-NEXT:    bsfq %rax, %rax
; SSE3-NEXT:    movd %rax, %xmm1
; SSE3-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
; SSE3-NEXT:    movd %xmm0, %rax
; SSE3-NEXT:    bsfq %rax, %rax
; SSE3-NEXT:    movd %rax, %xmm0
; SSE3-NEXT:    punpcklqdq {{.*#+}} xmm1 = xmm1[0],xmm0[0]
; SSE3-NEXT:    movdqa %xmm1, %xmm0
; SSE3-NEXT:    retq
;
; SSSE3-LABEL: testv2i64u:
; SSSE3:       # BB#0:
; SSSE3-NEXT:    movd %xmm0, %rax
; SSSE3-NEXT:    bsfq %rax, %rax
; SSSE3-NEXT:    movd %rax, %xmm1
; SSSE3-NEXT:    pshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
; SSSE3-NEXT:    movd %xmm0, %rax
; SSSE3-NEXT:    bsfq %rax, %rax
; SSSE3-NEXT:    movd %rax, %xmm0
; SSSE3-NEXT:    punpcklqdq {{.*#+}} xmm1 = xmm1[0],xmm0[0]
; SSSE3-NEXT:    movdqa %xmm1, %xmm0
; SSSE3-NEXT:    retq
;
; SSE41-LABEL: testv2i64u:
; SSE41:       # BB#0:
; SSE41-NEXT:    pextrq $1, %xmm0, %rax
; SSE41-NEXT:    bsfq %rax, %rax
; SSE41-NEXT:    movd %rax, %xmm1
; SSE41-NEXT:    movd %xmm0, %rax
; SSE41-NEXT:    bsfq %rax, %rax
; SSE41-NEXT:    movd %rax, %xmm0
; SSE41-NEXT:    punpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; SSE41-NEXT:    retq
;
; AVX1-LABEL: testv2i64u:
; AVX1:       # BB#0:
; AVX1-NEXT:    vpextrq $1, %xmm0, %rax
; AVX1-NEXT:    bsfq %rax, %rax
; AVX1-NEXT:    vmovq %rax, %xmm1
; AVX1-NEXT:    vmovq %xmm0, %rax
; AVX1-NEXT:    bsfq %rax, %rax
; AVX1-NEXT:    vmovq %rax, %xmm0
; AVX1-NEXT:    vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; AVX1-NEXT:    retq
;
; AVX2-LABEL: testv2i64u:
; AVX2:       # BB#0:
; AVX2-NEXT:    vpextrq $1, %xmm0, %rax
; AVX2-NEXT:    bsfq %rax, %rax
; AVX2-NEXT:    vmovq %rax, %xmm1
; AVX2-NEXT:    vmovq %xmm0, %rax
; AVX2-NEXT:    bsfq %rax, %rax
; AVX2-NEXT:    vmovq %rax, %xmm0
; AVX2-NEXT:    vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; AVX2-NEXT:    retq
;
; AVX512CDVL-LABEL: testv2i64u:
; AVX512CDVL:       # BB#0:
; AVX512CDVL-NEXT:    vpxord %xmm1, %xmm1, %xmm1
; AVX512CDVL-NEXT:    vpsubq %xmm0, %xmm1, %xmm1
; AVX512CDVL-NEXT:    vpandq %xmm1, %xmm0, %xmm0
; AVX512CDVL-NEXT:    vplzcntq %xmm0, %xmm0
; AVX512CDVL-NEXT:    vmovdqa64 {{.*#+}} xmm1 = [63,63]
; AVX512CDVL-NEXT:    vpsubq %xmm0, %xmm1, %xmm0
; AVX512CDVL-NEXT:    retq
;
; AVX512CD-LABEL: testv2i64u:
; AVX512CD:       # BB#0:
; AVX512CD-NEXT:    vpxor %xmm1, %xmm1, %xmm1
; AVX512CD-NEXT:    vpsubq %xmm0, %xmm1, %xmm1
; AVX512CD-NEXT:    vpand %xmm1, %xmm0, %xmm0
; AVX512CD-NEXT:    vplzcntq %zmm0, %zmm0
; AVX512CD-NEXT:    vmovdqa {{.*#+}} xmm1 = [63,63]
; AVX512CD-NEXT:    vpsubq %xmm0, %xmm1, %xmm0
; AVX512CD-NEXT:    retq
;
; X32-SSE-LABEL: testv2i64u:
; X32-SSE:       # BB#0:
; X32-SSE-NEXT:    pextrd $2, %xmm0, %eax
; X32-SSE-NEXT:    bsfl %eax, %ecx
; X32-SSE-NEXT:    pextrd $3, %xmm0, %edx
; X32-SSE-NEXT:    bsfl %edx, %edx
; X32-SSE-NEXT:    addl $32, %edx
; X32-SSE-NEXT:    testl %eax, %eax
; X32-SSE-NEXT:    cmovnel %ecx, %edx
; X32-SSE-NEXT:    movd %edx, %xmm1
; X32-SSE-NEXT:    movd %xmm0, %eax
; X32-SSE-NEXT:    bsfl %eax, %ecx
; X32-SSE-NEXT:    pextrd $1, %xmm0, %edx
; X32-SSE-NEXT:    bsfl %edx, %edx
; X32-SSE-NEXT:    addl $32, %edx
; X32-SSE-NEXT:    testl %eax, %eax
; X32-SSE-NEXT:    cmovnel %ecx, %edx
; X32-SSE-NEXT:    movd %edx, %xmm0
; X32-SSE-NEXT:    punpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; X32-SSE-NEXT:    retl
  %out = call <2 x i64> @llvm.cttz.v2i64(<2 x i64> %in, i1 -1)
  ret <2 x i64> %out
}

; Count trailing zeros of each lane of a <4 x i32> vector, calling the
; intrinsic with its second operand set to i1 0. No run expects bsf here - each
; one isolates the lowest set bit (x & -x), subtracts a constant-pool value
; (presumably a splat of 1; the checks only match the memory operand with a
; wildcard, so confirm against real llc output), and then counts bits. The
; SSE2 and SSE3 runs use shift/mask arithmetic, while SSSE3 and later use a
; pshufb lookup on the [0,1,1,2,...,4] nibble table. All of them finish with
; psadbw against zero and packuswb.
; The check lines below are autogenerated; regenerate them with
; utils/update_llc_test_checks.py instead of editing them by hand.
define <4 x i32> @testv4i32(<4 x i32> %in) nounwind {
; SSE2-LABEL: testv4i32:
; SSE2:       # BB#0:
; SSE2-NEXT:    pxor %xmm1, %xmm1
; SSE2-NEXT:    pxor %xmm2, %xmm2
; SSE2-NEXT:    psubd %xmm0, %xmm2
; SSE2-NEXT:    pand %xmm0, %xmm2
; SSE2-NEXT:    psubd {{.*}}(%rip), %xmm2
; SSE2-NEXT:    movdqa %xmm2, %xmm0
; SSE2-NEXT:    psrld $1, %xmm0
; SSE2-NEXT:    pand {{.*}}(%rip), %xmm0
; SSE2-NEXT:    psubd %xmm0, %xmm2
; SSE2-NEXT:    movdqa {{.*#+}} xmm0 = [858993459,858993459,858993459,858993459]
; SSE2-NEXT:    movdqa %xmm2, %xmm3
; SSE2-NEXT:    pand %xmm0, %xmm3
; SSE2-NEXT:    psrld $2, %xmm2
; SSE2-NEXT:    pand %xmm0, %xmm2
; SSE2-NEXT:    paddd %xmm3, %xmm2
; SSE2-NEXT:    movdqa %xmm2, %xmm0
; SSE2-NEXT:    psrld $4, %xmm0
; SSE2-NEXT:    paddd %xmm2, %xmm0
; SSE2-NEXT:    pand {{.*}}(%rip), %xmm0
; SSE2-NEXT:    movdqa %xmm0, %xmm2
; SSE2-NEXT:    punpckhdq {{.*#+}} xmm2 = xmm2[2],xmm1[2],xmm2[3],xmm1[3]
; SSE2-NEXT:    psadbw %xmm1, %xmm2
; SSE2-NEXT:    punpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1]
; SSE2-NEXT:    psadbw %xmm1, %xmm0
; SSE2-NEXT:    packuswb %xmm2, %xmm0
; SSE2-NEXT:    retq
;
; SSE3-LABEL: testv4i32:
; SSE3:       # BB#0:
; SSE3-NEXT:    pxor %xmm1, %xmm1
; SSE3-NEXT:    pxor %xmm2, %xmm2
; SSE3-NEXT:    psubd %xmm0, %xmm2
; SSE3-NEXT:    pand %xmm0, %xmm2
; SSE3-NEXT:    psubd {{.*}}(%rip), %xmm2
; SSE3-NEXT:    movdqa %xmm2, %xmm0
; SSE3-NEXT:    psrld $1, %xmm0
; SSE3-NEXT:    pand {{.*}}(%rip), %xmm0
; SSE3-NEXT:    psubd %xmm0, %xmm2
; SSE3-NEXT:    movdqa {{.*#+}} xmm0 = [858993459,858993459,858993459,858993459]
; SSE3-NEXT:    movdqa %xmm2, %xmm3
; SSE3-NEXT:    pand %xmm0, %xmm3
; SSE3-NEXT:    psrld $2, %xmm2
; SSE3-NEXT:    pand %xmm0, %xmm2
; SSE3-NEXT:    paddd %xmm3, %xmm2
; SSE3-NEXT:    movdqa %xmm2, %xmm0
; SSE3-NEXT:    psrld $4, %xmm0
; SSE3-NEXT:    paddd %xmm2, %xmm0
; SSE3-NEXT:    pand {{.*}}(%rip), %xmm0
; SSE3-NEXT:    movdqa %xmm0, %xmm2
; SSE3-NEXT:    punpckhdq {{.*#+}} xmm2 = xmm2[2],xmm1[2],xmm2[3],xmm1[3]
; SSE3-NEXT:    psadbw %xmm1, %xmm2
; SSE3-NEXT:    punpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1]
; SSE3-NEXT:    psadbw %xmm1, %xmm0
; SSE3-NEXT:    packuswb %xmm2, %xmm0
; SSE3-NEXT:    retq
;
; SSSE3-LABEL: testv4i32:
; SSSE3:       # BB#0:
; SSSE3-NEXT:    pxor %xmm1, %xmm1
; SSSE3-NEXT:    pxor %xmm2, %xmm2
; SSSE3-NEXT:    psubd %xmm0, %xmm2
; SSSE3-NEXT:    pand %xmm0, %xmm2
; SSSE3-NEXT:    psubd {{.*}}(%rip), %xmm2
; SSSE3-NEXT:    movdqa {{.*#+}} xmm3 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15]
; SSSE3-NEXT:    movdqa %xmm2, %xmm4
; SSSE3-NEXT:    pand %xmm3, %xmm4
; SSSE3-NEXT:    movdqa {{.*#+}} xmm0 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4]
; SSSE3-NEXT:    movdqa %xmm0, %xmm5
; SSSE3-NEXT:    pshufb %xmm4, %xmm5
; SSSE3-NEXT:    psrlw $4, %xmm2
; SSSE3-NEXT:    pand %xmm3, %xmm2
; SSSE3-NEXT:    pshufb %xmm2, %xmm0
; SSSE3-NEXT:    paddb %xmm5, %xmm0
; SSSE3-NEXT:    movdqa %xmm0, %xmm2
; SSSE3-NEXT:    punpckhdq {{.*#+}} xmm2 = xmm2[2],xmm1[2],xmm2[3],xmm1[3]
; SSSE3-NEXT:    psadbw %xmm1, %xmm2
; SSSE3-NEXT:    punpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1]
; SSSE3-NEXT:    psadbw %xmm1, %xmm0
; SSSE3-NEXT:    packuswb %xmm2, %xmm0
; SSSE3-NEXT:    retq
;
; SSE41-LABEL: testv4i32:
; SSE41:       # BB#0:
; SSE41-NEXT:    pxor %xmm1, %xmm1
; SSE41-NEXT:    pxor %xmm2, %xmm2
; SSE41-NEXT:    psubd %xmm0, %xmm2
; SSE41-NEXT:    pand %xmm0, %xmm2
; SSE41-NEXT:    psubd {{.*}}(%rip), %xmm2
; SSE41-NEXT:    movdqa {{.*#+}} xmm3 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15]
; SSE41-NEXT:    movdqa %xmm2, %xmm4
; SSE41-NEXT:    pand %xmm3, %xmm4
; SSE41-NEXT:    movdqa {{.*#+}} xmm0 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4]
; SSE41-NEXT:    movdqa %xmm0, %xmm5
; SSE41-NEXT:    pshufb %xmm4, %xmm5
; SSE41-NEXT:    psrlw $4, %xmm2
; SSE41-NEXT:    pand %xmm3, %xmm2
; SSE41-NEXT:    pshufb %xmm2, %xmm0
; SSE41-NEXT:    paddb %xmm5, %xmm0
; SSE41-NEXT:    movdqa %xmm0, %xmm2
; SSE41-NEXT:    punpckhdq {{.*#+}} xmm2 = xmm2[2],xmm1[2],xmm2[3],xmm1[3]
; SSE41-NEXT:    psadbw %xmm1, %xmm2
; SSE41-NEXT:    punpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1]
; SSE41-NEXT:    psadbw %xmm1, %xmm0
; SSE41-NEXT:    packuswb %xmm2, %xmm0
; SSE41-NEXT:    retq
;
; AVX1-LABEL: testv4i32:
; AVX1:       # BB#0:
; AVX1-NEXT:    vpxor %xmm1, %xmm1, %xmm1
; AVX1-NEXT:    vpsubd %xmm0, %xmm1, %xmm2
; AVX1-NEXT:    vpand %xmm2, %xmm0, %xmm0
; AVX1-NEXT:    vpsubd {{.*}}(%rip), %xmm0, %xmm0
; AVX1-NEXT:    vmovdqa {{.*#+}} xmm2 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15]
; AVX1-NEXT:    vpand %xmm2, %xmm0, %xmm3
; AVX1-NEXT:    vmovdqa {{.*#+}} xmm4 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4]
; AVX1-NEXT:    vpshufb %xmm3, %xmm4, %xmm3
; AVX1-NEXT:    vpsrlw $4, %xmm0, %xmm0
; AVX1-NEXT:    vpand %xmm2, %xmm0, %xmm0
; AVX1-NEXT:    vpshufb %xmm0, %xmm4, %xmm0
; AVX1-NEXT:    vpaddb %xmm3, %xmm0, %xmm0
; AVX1-NEXT:    vpunpckhdq {{.*#+}} xmm2 = xmm0[2],xmm1[2],xmm0[3],xmm1[3]
; AVX1-NEXT:    vpsadbw %xmm1, %xmm2, %xmm2
; AVX1-NEXT:    vpunpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1]
; AVX1-NEXT:    vpsadbw %xmm1, %xmm0, %xmm0
; AVX1-NEXT:    vpackuswb %xmm2, %xmm0, %xmm0
; AVX1-NEXT:    retq
;
; AVX2-LABEL: testv4i32:
; AVX2:       # BB#0:
; AVX2-NEXT:    vpxor %xmm1, %xmm1, %xmm1
; AVX2-NEXT:    vpsubd %xmm0, %xmm1, %xmm2
; AVX2-NEXT:    vpand %xmm2, %xmm0, %xmm0
; AVX2-NEXT:    vpbroadcastd {{.*}}(%rip), %xmm2
; AVX2-NEXT:    vpsubd %xmm2, %xmm0, %xmm0
; AVX2-NEXT:    vmovdqa {{.*#+}} xmm2 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15]
; AVX2-NEXT:    vpand %xmm2, %xmm0, %xmm3
; AVX2-NEXT:    vmovdqa {{.*#+}} xmm4 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4]
; AVX2-NEXT:    vpshufb %xmm3, %xmm4, %xmm3
; AVX2-NEXT:    vpsrlw $4, %xmm0, %xmm0
; AVX2-NEXT:    vpand %xmm2, %xmm0, %xmm0
; AVX2-NEXT:    vpshufb %xmm0, %xmm4, %xmm0
; AVX2-NEXT:    vpaddb %xmm3, %xmm0, %xmm0
; AVX2-NEXT:    vpunpckhdq {{.*#+}} xmm2 = xmm0[2],xmm1[2],xmm0[3],xmm1[3]
; AVX2-NEXT:    vpsadbw %xmm1, %xmm2, %xmm2
; AVX2-NEXT:    vpunpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1]
; AVX2-NEXT:    vpsadbw %xmm1, %xmm0, %xmm0
; AVX2-NEXT:    vpackuswb %xmm2, %xmm0, %xmm0
; AVX2-NEXT:    retq
;
; AVX512CDVL-LABEL: testv4i32:
; AVX512CDVL:       # BB#0:
; AVX512CDVL-NEXT:    vpxord %xmm1, %xmm1, %xmm1
; AVX512CDVL-NEXT:    vpsubd %xmm0, %xmm1, %xmm2
; AVX512CDVL-NEXT:    vpandd %xmm2, %xmm0, %xmm0
; AVX512CDVL-NEXT:    vpsubd {{.*}}(%rip){1to4}, %xmm0, %xmm0
; AVX512CDVL-NEXT:    vmovdqa64 {{.*#+}} xmm2 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15]
; AVX512CDVL-NEXT:    vpandq %xmm2, %xmm0, %xmm3
; AVX512CDVL-NEXT:    vmovdqa64 {{.*#+}} xmm4 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4]
; AVX512CDVL-NEXT:    vpshufb %xmm3, %xmm4, %xmm3
; AVX512CDVL-NEXT:    vpsrlw $4, %xmm0, %xmm0
; AVX512CDVL-NEXT:    vpandq %xmm2, %xmm0, %xmm0
; AVX512CDVL-NEXT:    vpshufb %xmm0, %xmm4, %xmm0
; AVX512CDVL-NEXT:    vpaddb %xmm3, %xmm0, %xmm0
; AVX512CDVL-NEXT:    vpunpckhdq {{.*#+}} xmm2 = xmm0[2],xmm1[2],xmm0[3],xmm1[3]
; AVX512CDVL-NEXT:    vpsadbw %xmm1, %xmm2, %xmm2
; AVX512CDVL-NEXT:    vpunpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1]
; AVX512CDVL-NEXT:    vpsadbw %xmm1, %xmm0, %xmm0
; AVX512CDVL-NEXT:    vpackuswb %xmm2, %xmm0, %xmm0
; AVX512CDVL-NEXT:    retq
;
; AVX512CD-LABEL: testv4i32:
; AVX512CD:       # BB#0:
; AVX512CD-NEXT:    vpxor %xmm1, %xmm1, %xmm1
; AVX512CD-NEXT:    vpsubd %xmm0, %xmm1, %xmm2
; AVX512CD-NEXT:    vpand %xmm2, %xmm0, %xmm0
; AVX512CD-NEXT:    vpbroadcastd {{.*}}(%rip), %xmm2
; AVX512CD-NEXT:    vpsubd %xmm2, %xmm0, %xmm0
; AVX512CD-NEXT:    vmovdqa {{.*#+}} xmm2 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15]
; AVX512CD-NEXT:    vpand %xmm2, %xmm0, %xmm3
; AVX512CD-NEXT:    vmovdqa {{.*#+}} xmm4 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4]
; AVX512CD-NEXT:    vpshufb %xmm3, %xmm4, %xmm3
; AVX512CD-NEXT:    vpsrlw $4, %xmm0, %xmm0
; AVX512CD-NEXT:    vpand %xmm2, %xmm0, %xmm0
; AVX512CD-NEXT:    vpshufb %xmm0, %xmm4, %xmm0
; AVX512CD-NEXT:    vpaddb %xmm3, %xmm0, %xmm0
; AVX512CD-NEXT:    vpunpckhdq {{.*#+}} xmm2 = xmm0[2],xmm1[2],xmm0[3],xmm1[3]
; AVX512CD-NEXT:    vpsadbw %xmm1, %xmm2, %xmm2
; AVX512CD-NEXT:    vpunpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1]
; AVX512CD-NEXT:    vpsadbw %xmm1, %xmm0, %xmm0
; AVX512CD-NEXT:    vpackuswb %xmm2, %xmm0, %xmm0
; AVX512CD-NEXT:    retq
;
; X32-SSE-LABEL: testv4i32:
; X32-SSE:       # BB#0:
; X32-SSE-NEXT:    pxor %xmm1, %xmm1
; X32-SSE-NEXT:    pxor %xmm2, %xmm2
; X32-SSE-NEXT:    psubd %xmm0, %xmm2
; X32-SSE-NEXT:    pand %xmm0, %xmm2
; X32-SSE-NEXT:    psubd {{\.LCPI.*}}, %xmm2
; X32-SSE-NEXT:    movdqa {{.*#+}} xmm3 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15]
; X32-SSE-NEXT:    movdqa %xmm2, %xmm4
; X32-SSE-NEXT:    pand %xmm3, %xmm4
; X32-SSE-NEXT:    movdqa {{.*#+}} xmm0 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4]
; X32-SSE-NEXT:    movdqa %xmm0, %xmm5
; X32-SSE-NEXT:    pshufb %xmm4, %xmm5
; X32-SSE-NEXT:    psrlw $4, %xmm2
; X32-SSE-NEXT:    pand %xmm3, %xmm2
; X32-SSE-NEXT:    pshufb %xmm2, %xmm0
; X32-SSE-NEXT:    paddb %xmm5, %xmm0
; X32-SSE-NEXT:    movdqa %xmm0, %xmm2
; X32-SSE-NEXT:    punpckhdq {{.*#+}} xmm2 = xmm2[2],xmm1[2],xmm2[3],xmm1[3]
; X32-SSE-NEXT:    psadbw %xmm1, %xmm2
; X32-SSE-NEXT:    punpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1]
; X32-SSE-NEXT:    psadbw %xmm1, %xmm0
; X32-SSE-NEXT:    packuswb %xmm2, %xmm0
; X32-SSE-NEXT:    retl
  %out = call <4 x i32> @llvm.cttz.v4i32(<4 x i32> %in, i1 0)
  ret <4 x i32> %out
}

define <4 x i32> @testv4i32u(<4 x i32> %in) nounwind {
; SSE2-LABEL: testv4i32u:
; SSE2:       # BB#0:
; SSE2-NEXT:    pxor %xmm1, %xmm1
; SSE2-NEXT:    pxor %xmm2, %xmm2
; SSE2-NEXT:    psubd %xmm0, %xmm2
; SSE2-NEXT:    pand %xmm0, %xmm2
467*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubd {{.*}}(%rip), %xmm2 468*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm2, %xmm0 469*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrld $1, %xmm0 470*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand {{.*}}(%rip), %xmm0 471*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubd %xmm0, %xmm2 472*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa {{.*#+}} xmm0 = [858993459,858993459,858993459,858993459] 473*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm2, %xmm3 474*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm3 475*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrld $2, %xmm2 476*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm2 477*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: paddd %xmm3, %xmm2 478*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm2, %xmm0 479*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrld $4, %xmm0 480*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: paddd %xmm2, %xmm0 481*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand {{.*}}(%rip), %xmm0 482*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm0, %xmm2 483*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: punpckhdq {{.*#+}} xmm2 = xmm2[2],xmm1[2],xmm2[3],xmm1[3] 484*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psadbw %xmm1, %xmm2 485*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: punpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1] 486*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psadbw %xmm1, %xmm0 487*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: packuswb %xmm2, %xmm0 488*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: retq 489*9880d681SAndroid Build Coastguard Worker; 490*9880d681SAndroid Build Coastguard Worker; SSE3-LABEL: testv4i32u: 491*9880d681SAndroid Build Coastguard Worker; SSE3: # BB#0: 492*9880d681SAndroid 
Build Coastguard Worker; SSE3-NEXT: pxor %xmm1, %xmm1 493*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pxor %xmm2, %xmm2 494*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubd %xmm0, %xmm2 495*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm2 496*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubd {{.*}}(%rip), %xmm2 497*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm2, %xmm0 498*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrld $1, %xmm0 499*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand {{.*}}(%rip), %xmm0 500*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubd %xmm0, %xmm2 501*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa {{.*#+}} xmm0 = [858993459,858993459,858993459,858993459] 502*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm2, %xmm3 503*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm3 504*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrld $2, %xmm2 505*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm2 506*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: paddd %xmm3, %xmm2 507*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm2, %xmm0 508*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrld $4, %xmm0 509*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: paddd %xmm2, %xmm0 510*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand {{.*}}(%rip), %xmm0 511*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm0, %xmm2 512*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: punpckhdq {{.*#+}} xmm2 = xmm2[2],xmm1[2],xmm2[3],xmm1[3] 513*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psadbw %xmm1, %xmm2 514*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: punpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1] 515*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psadbw %xmm1, %xmm0 516*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: 
packuswb %xmm2, %xmm0 517*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: retq 518*9880d681SAndroid Build Coastguard Worker; 519*9880d681SAndroid Build Coastguard Worker; SSSE3-LABEL: testv4i32u: 520*9880d681SAndroid Build Coastguard Worker; SSSE3: # BB#0: 521*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pxor %xmm1, %xmm1 522*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pxor %xmm2, %xmm2 523*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psubd %xmm0, %xmm2 524*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm0, %xmm2 525*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psubd {{.*}}(%rip), %xmm2 526*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa {{.*#+}} xmm3 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 527*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa %xmm2, %xmm4 528*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm3, %xmm4 529*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa {{.*#+}} xmm0 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 530*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa %xmm0, %xmm5 531*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pshufb %xmm4, %xmm5 532*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psrlw $4, %xmm2 533*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm3, %xmm2 534*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pshufb %xmm2, %xmm0 535*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: paddb %xmm5, %xmm0 536*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa %xmm0, %xmm2 537*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: punpckhdq {{.*#+}} xmm2 = xmm2[2],xmm1[2],xmm2[3],xmm1[3] 538*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psadbw %xmm1, %xmm2 539*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: punpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1] 540*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psadbw %xmm1, %xmm0 541*9880d681SAndroid 
Build Coastguard Worker; SSSE3-NEXT: packuswb %xmm2, %xmm0 542*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: retq 543*9880d681SAndroid Build Coastguard Worker; 544*9880d681SAndroid Build Coastguard Worker; SSE41-LABEL: testv4i32u: 545*9880d681SAndroid Build Coastguard Worker; SSE41: # BB#0: 546*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pxor %xmm1, %xmm1 547*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pxor %xmm2, %xmm2 548*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psubd %xmm0, %xmm2 549*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm0, %xmm2 550*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psubd {{.*}}(%rip), %xmm2 551*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa {{.*#+}} xmm3 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 552*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa %xmm2, %xmm4 553*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm3, %xmm4 554*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa {{.*#+}} xmm0 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 555*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa %xmm0, %xmm5 556*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pshufb %xmm4, %xmm5 557*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psrlw $4, %xmm2 558*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm3, %xmm2 559*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pshufb %xmm2, %xmm0 560*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: paddb %xmm5, %xmm0 561*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa %xmm0, %xmm2 562*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: punpckhdq {{.*#+}} xmm2 = xmm2[2],xmm1[2],xmm2[3],xmm1[3] 563*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psadbw %xmm1, %xmm2 564*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: punpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1] 565*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: 
psadbw %xmm1, %xmm0 566*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: packuswb %xmm2, %xmm0 567*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: retq 568*9880d681SAndroid Build Coastguard Worker; 569*9880d681SAndroid Build Coastguard Worker; AVX1-LABEL: testv4i32u: 570*9880d681SAndroid Build Coastguard Worker; AVX1: # BB#0: 571*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpxor %xmm1, %xmm1, %xmm1 572*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsubd %xmm0, %xmm1, %xmm2 573*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm2, %xmm0, %xmm0 574*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsubd {{.*}}(%rip), %xmm0, %xmm0 575*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovdqa {{.*#+}} xmm2 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 576*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm2, %xmm0, %xmm3 577*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovdqa {{.*#+}} xmm4 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 578*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpshufb %xmm3, %xmm4, %xmm3 579*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsrlw $4, %xmm0, %xmm0 580*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm2, %xmm0, %xmm0 581*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpshufb %xmm0, %xmm4, %xmm0 582*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpaddb %xmm3, %xmm0, %xmm0 583*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpunpckhdq {{.*#+}} xmm2 = xmm0[2],xmm1[2],xmm0[3],xmm1[3] 584*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsadbw %xmm1, %xmm2, %xmm2 585*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpunpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1] 586*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsadbw %xmm1, %xmm0, %xmm0 587*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpackuswb %xmm2, %xmm0, %xmm0 588*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: retq 589*9880d681SAndroid 
Build Coastguard Worker; 590*9880d681SAndroid Build Coastguard Worker; AVX2-LABEL: testv4i32u: 591*9880d681SAndroid Build Coastguard Worker; AVX2: # BB#0: 592*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpxor %xmm1, %xmm1, %xmm1 593*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsubd %xmm0, %xmm1, %xmm2 594*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm2, %xmm0, %xmm0 595*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpbroadcastd {{.*}}(%rip), %xmm2 596*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsubd %xmm2, %xmm0, %xmm0 597*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovdqa {{.*#+}} xmm2 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 598*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm2, %xmm0, %xmm3 599*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovdqa {{.*#+}} xmm4 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 600*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpshufb %xmm3, %xmm4, %xmm3 601*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsrlw $4, %xmm0, %xmm0 602*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm2, %xmm0, %xmm0 603*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpshufb %xmm0, %xmm4, %xmm0 604*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpaddb %xmm3, %xmm0, %xmm0 605*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpunpckhdq {{.*#+}} xmm2 = xmm0[2],xmm1[2],xmm0[3],xmm1[3] 606*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsadbw %xmm1, %xmm2, %xmm2 607*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpunpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1] 608*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsadbw %xmm1, %xmm0, %xmm0 609*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpackuswb %xmm2, %xmm0, %xmm0 610*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: retq 611*9880d681SAndroid Build Coastguard Worker; 612*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-LABEL: testv4i32u: 
613*9880d681SAndroid Build Coastguard Worker; AVX512CDVL: # BB#0: 614*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpxord %xmm1, %xmm1, %xmm1 615*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsubd %xmm0, %xmm1, %xmm1 616*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpandd %xmm1, %xmm0, %xmm0 617*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vplzcntd %xmm0, %xmm0 618*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpbroadcastd {{.*}}(%rip), %xmm1 619*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsubd %xmm0, %xmm1, %xmm0 620*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: retq 621*9880d681SAndroid Build Coastguard Worker; 622*9880d681SAndroid Build Coastguard Worker; AVX512CD-LABEL: testv4i32u: 623*9880d681SAndroid Build Coastguard Worker; AVX512CD: # BB#0: 624*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpxor %xmm1, %xmm1, %xmm1 625*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsubd %xmm0, %xmm1, %xmm1 626*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpand %xmm1, %xmm0, %xmm0 627*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vplzcntd %zmm0, %zmm0 628*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpbroadcastd {{.*}}(%rip), %xmm1 629*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsubd %xmm0, %xmm1, %xmm0 630*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: retq 631*9880d681SAndroid Build Coastguard Worker; 632*9880d681SAndroid Build Coastguard Worker; X32-SSE-LABEL: testv4i32u: 633*9880d681SAndroid Build Coastguard Worker; X32-SSE: # BB#0: 634*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pxor %xmm1, %xmm1 635*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pxor %xmm2, %xmm2 636*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psubd %xmm0, %xmm2 637*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm0, %xmm2 638*9880d681SAndroid Build Coastguard Worker; 
X32-SSE-NEXT: psubd {{\.LCPI.*}}, %xmm2 639*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa {{.*#+}} xmm3 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 640*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa %xmm2, %xmm4 641*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm3, %xmm4 642*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa {{.*#+}} xmm0 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 643*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa %xmm0, %xmm5 644*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pshufb %xmm4, %xmm5 645*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psrlw $4, %xmm2 646*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm3, %xmm2 647*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pshufb %xmm2, %xmm0 648*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: paddb %xmm5, %xmm0 649*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa %xmm0, %xmm2 650*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: punpckhdq {{.*#+}} xmm2 = xmm2[2],xmm1[2],xmm2[3],xmm1[3] 651*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psadbw %xmm1, %xmm2 652*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: punpckldq {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1] 653*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psadbw %xmm1, %xmm0 654*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: packuswb %xmm2, %xmm0 655*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: retl 656*9880d681SAndroid Build Coastguard Worker %out = call <4 x i32> @llvm.cttz.v4i32(<4 x i32> %in, i1 -1) 657*9880d681SAndroid Build Coastguard Worker ret <4 x i32> %out 658*9880d681SAndroid Build Coastguard Worker} 659*9880d681SAndroid Build Coastguard Worker 660*9880d681SAndroid Build Coastguard Workerdefine <8 x i16> @testv8i16(<8 x i16> %in) nounwind { 661*9880d681SAndroid Build Coastguard Worker; SSE2-LABEL: testv8i16: 662*9880d681SAndroid Build 
Coastguard Worker; SSE2: # BB#0: 663*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pxor %xmm1, %xmm1 664*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubw %xmm0, %xmm1 665*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm1 666*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubw {{.*}}(%rip), %xmm1 667*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm1, %xmm0 668*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $1, %xmm0 669*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand {{.*}}(%rip), %xmm0 670*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubw %xmm0, %xmm1 671*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa {{.*#+}} xmm0 = [13107,13107,13107,13107,13107,13107,13107,13107] 672*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm1, %xmm2 673*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm2 674*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $2, %xmm1 675*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm1 676*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: paddw %xmm2, %xmm1 677*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm1, %xmm2 678*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $4, %xmm2 679*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: paddw %xmm1, %xmm2 680*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand {{.*}}(%rip), %xmm2 681*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm2, %xmm0 682*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psllw $8, %xmm0 683*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: paddb %xmm2, %xmm0 684*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $8, %xmm0 685*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: retq 686*9880d681SAndroid Build Coastguard Worker; 687*9880d681SAndroid Build Coastguard Worker; SSE3-LABEL: testv8i16: 688*9880d681SAndroid Build Coastguard Worker; SSE3: # BB#0: 
689*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pxor %xmm1, %xmm1 690*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubw %xmm0, %xmm1 691*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm1 692*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubw {{.*}}(%rip), %xmm1 693*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm1, %xmm0 694*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $1, %xmm0 695*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand {{.*}}(%rip), %xmm0 696*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubw %xmm0, %xmm1 697*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa {{.*#+}} xmm0 = [13107,13107,13107,13107,13107,13107,13107,13107] 698*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm1, %xmm2 699*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm2 700*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $2, %xmm1 701*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm1 702*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: paddw %xmm2, %xmm1 703*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm1, %xmm2 704*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $4, %xmm2 705*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: paddw %xmm1, %xmm2 706*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand {{.*}}(%rip), %xmm2 707*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm2, %xmm0 708*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psllw $8, %xmm0 709*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: paddb %xmm2, %xmm0 710*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $8, %xmm0 711*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: retq 712*9880d681SAndroid Build Coastguard Worker; 713*9880d681SAndroid Build Coastguard Worker; SSSE3-LABEL: testv8i16: 714*9880d681SAndroid Build Coastguard Worker; SSSE3: # BB#0: 715*9880d681SAndroid Build 
Coastguard Worker; SSSE3-NEXT: pxor %xmm1, %xmm1 716*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psubw %xmm0, %xmm1 717*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm0, %xmm1 718*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psubw {{.*}}(%rip), %xmm1 719*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa {{.*#+}} xmm0 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 720*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa %xmm1, %xmm2 721*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm0, %xmm2 722*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 723*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa %xmm3, %xmm4 724*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pshufb %xmm2, %xmm4 725*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psrlw $4, %xmm1 726*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm0, %xmm1 727*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pshufb %xmm1, %xmm3 728*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: paddb %xmm4, %xmm3 729*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa %xmm3, %xmm0 730*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psllw $8, %xmm0 731*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: paddb %xmm3, %xmm0 732*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psrlw $8, %xmm0 733*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: retq 734*9880d681SAndroid Build Coastguard Worker; 735*9880d681SAndroid Build Coastguard Worker; SSE41-LABEL: testv8i16: 736*9880d681SAndroid Build Coastguard Worker; SSE41: # BB#0: 737*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pxor %xmm1, %xmm1 738*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psubw %xmm0, %xmm1 739*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm0, %xmm1 740*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psubw {{.*}}(%rip), 
%xmm1 741*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa {{.*#+}} xmm0 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 742*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa %xmm1, %xmm2 743*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm0, %xmm2 744*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 745*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa %xmm3, %xmm4 746*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pshufb %xmm2, %xmm4 747*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psrlw $4, %xmm1 748*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm0, %xmm1 749*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pshufb %xmm1, %xmm3 750*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: paddb %xmm4, %xmm3 751*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa %xmm3, %xmm0 752*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psllw $8, %xmm0 753*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: paddb %xmm3, %xmm0 754*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psrlw $8, %xmm0 755*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: retq 756*9880d681SAndroid Build Coastguard Worker; 757*9880d681SAndroid Build Coastguard Worker; AVX1-LABEL: testv8i16: 758*9880d681SAndroid Build Coastguard Worker; AVX1: # BB#0: 759*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpxor %xmm1, %xmm1, %xmm1 760*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsubw %xmm0, %xmm1, %xmm1 761*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm1, %xmm0, %xmm0 762*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsubw {{.*}}(%rip), %xmm0, %xmm0 763*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 764*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm1, %xmm0, %xmm2 765*9880d681SAndroid Build 
Coastguard Worker; AVX1-NEXT: vmovdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 766*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpshufb %xmm2, %xmm3, %xmm2 767*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsrlw $4, %xmm0, %xmm0 768*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm1, %xmm0, %xmm0 769*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpshufb %xmm0, %xmm3, %xmm0 770*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpaddb %xmm2, %xmm0, %xmm0 771*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsllw $8, %xmm0, %xmm1 772*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpaddb %xmm0, %xmm1, %xmm0 773*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsrlw $8, %xmm0, %xmm0 774*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: retq 775*9880d681SAndroid Build Coastguard Worker; 776*9880d681SAndroid Build Coastguard Worker; AVX2-LABEL: testv8i16: 777*9880d681SAndroid Build Coastguard Worker; AVX2: # BB#0: 778*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpxor %xmm1, %xmm1, %xmm1 779*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsubw %xmm0, %xmm1, %xmm1 780*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm1, %xmm0, %xmm0 781*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsubw {{.*}}(%rip), %xmm0, %xmm0 782*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 783*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm1, %xmm0, %xmm2 784*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 785*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpshufb %xmm2, %xmm3, %xmm2 786*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsrlw $4, %xmm0, %xmm0 787*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm1, %xmm0, %xmm0 788*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpshufb %xmm0, %xmm3, %xmm0 
789*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpaddb %xmm2, %xmm0, %xmm0 790*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsllw $8, %xmm0, %xmm1 791*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpaddb %xmm0, %xmm1, %xmm0 792*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsrlw $8, %xmm0, %xmm0 793*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: retq 794*9880d681SAndroid Build Coastguard Worker; 795*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-LABEL: testv8i16: 796*9880d681SAndroid Build Coastguard Worker; AVX512CDVL: # BB#0: 797*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpxord %xmm1, %xmm1, %xmm1 798*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsubw %xmm0, %xmm1, %xmm1 799*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpandq %xmm1, %xmm0, %xmm0 800*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsubw {{.*}}(%rip), %xmm0, %xmm0 801*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa64 {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 802*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpandq %xmm1, %xmm0, %xmm2 803*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa64 {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 804*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpshufb %xmm2, %xmm3, %xmm2 805*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsrlw $4, %xmm0, %xmm0 806*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpandq %xmm1, %xmm0, %xmm0 807*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpshufb %xmm0, %xmm3, %xmm0 808*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpaddb %xmm2, %xmm0, %xmm0 809*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsllw $8, %xmm0, %xmm1 810*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpaddb %xmm0, %xmm1, %xmm0 811*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsrlw $8, 
%xmm0, %xmm0 812*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: retq 813*9880d681SAndroid Build Coastguard Worker; 814*9880d681SAndroid Build Coastguard Worker; AVX512CD-LABEL: testv8i16: 815*9880d681SAndroid Build Coastguard Worker; AVX512CD: # BB#0: 816*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpxor %xmm1, %xmm1, %xmm1 817*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsubw %xmm0, %xmm1, %xmm1 818*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpand %xmm1, %xmm0, %xmm0 819*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsubw {{.*}}(%rip), %xmm0, %xmm0 820*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 821*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpand %xmm1, %xmm0, %xmm2 822*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 823*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpshufb %xmm2, %xmm3, %xmm2 824*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsrlw $4, %xmm0, %xmm0 825*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpand %xmm1, %xmm0, %xmm0 826*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpshufb %xmm0, %xmm3, %xmm0 827*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpaddb %xmm2, %xmm0, %xmm0 828*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsllw $8, %xmm0, %xmm1 829*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpaddb %xmm0, %xmm1, %xmm0 830*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsrlw $8, %xmm0, %xmm0 831*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: retq 832*9880d681SAndroid Build Coastguard Worker; 833*9880d681SAndroid Build Coastguard Worker; X32-SSE-LABEL: testv8i16: 834*9880d681SAndroid Build Coastguard Worker; X32-SSE: # BB#0: 835*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pxor %xmm1, %xmm1 
836*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psubw %xmm0, %xmm1 837*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm0, %xmm1 838*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psubw {{\.LCPI.*}}, %xmm1 839*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa {{.*#+}} xmm0 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 840*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa %xmm1, %xmm2 841*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm0, %xmm2 842*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 843*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa %xmm3, %xmm4 844*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pshufb %xmm2, %xmm4 845*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psrlw $4, %xmm1 846*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm0, %xmm1 847*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pshufb %xmm1, %xmm3 848*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: paddb %xmm4, %xmm3 849*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa %xmm3, %xmm0 850*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psllw $8, %xmm0 851*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: paddb %xmm3, %xmm0 852*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psrlw $8, %xmm0 853*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: retl 854*9880d681SAndroid Build Coastguard Worker %out = call <8 x i16> @llvm.cttz.v8i16(<8 x i16> %in, i1 0) 855*9880d681SAndroid Build Coastguard Worker ret <8 x i16> %out 856*9880d681SAndroid Build Coastguard Worker} 857*9880d681SAndroid Build Coastguard Worker 858*9880d681SAndroid Build Coastguard Workerdefine <8 x i16> @testv8i16u(<8 x i16> %in) nounwind { 859*9880d681SAndroid Build Coastguard Worker; SSE2-LABEL: testv8i16u: 860*9880d681SAndroid Build Coastguard Worker; SSE2: # BB#0: 
861*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pxor %xmm1, %xmm1 862*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubw %xmm0, %xmm1 863*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm1 864*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubw {{.*}}(%rip), %xmm1 865*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm1, %xmm0 866*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $1, %xmm0 867*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand {{.*}}(%rip), %xmm0 868*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubw %xmm0, %xmm1 869*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa {{.*#+}} xmm0 = [13107,13107,13107,13107,13107,13107,13107,13107] 870*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm1, %xmm2 871*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm2 872*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $2, %xmm1 873*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm1 874*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: paddw %xmm2, %xmm1 875*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm1, %xmm2 876*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $4, %xmm2 877*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: paddw %xmm1, %xmm2 878*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand {{.*}}(%rip), %xmm2 879*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm2, %xmm0 880*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psllw $8, %xmm0 881*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: paddb %xmm2, %xmm0 882*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $8, %xmm0 883*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: retq 884*9880d681SAndroid Build Coastguard Worker; 885*9880d681SAndroid Build Coastguard Worker; SSE3-LABEL: testv8i16u: 886*9880d681SAndroid Build Coastguard Worker; SSE3: # BB#0: 887*9880d681SAndroid Build 
Coastguard Worker; SSE3-NEXT: pxor %xmm1, %xmm1 888*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubw %xmm0, %xmm1 889*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm1 890*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubw {{.*}}(%rip), %xmm1 891*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm1, %xmm0 892*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $1, %xmm0 893*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand {{.*}}(%rip), %xmm0 894*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubw %xmm0, %xmm1 895*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa {{.*#+}} xmm0 = [13107,13107,13107,13107,13107,13107,13107,13107] 896*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm1, %xmm2 897*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm2 898*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $2, %xmm1 899*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm1 900*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: paddw %xmm2, %xmm1 901*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm1, %xmm2 902*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $4, %xmm2 903*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: paddw %xmm1, %xmm2 904*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand {{.*}}(%rip), %xmm2 905*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm2, %xmm0 906*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psllw $8, %xmm0 907*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: paddb %xmm2, %xmm0 908*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $8, %xmm0 909*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: retq 910*9880d681SAndroid Build Coastguard Worker; 911*9880d681SAndroid Build Coastguard Worker; SSSE3-LABEL: testv8i16u: 912*9880d681SAndroid Build Coastguard Worker; SSSE3: # BB#0: 913*9880d681SAndroid Build Coastguard Worker; 
SSSE3-NEXT: pxor %xmm1, %xmm1 914*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psubw %xmm0, %xmm1 915*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm0, %xmm1 916*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psubw {{.*}}(%rip), %xmm1 917*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa {{.*#+}} xmm0 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 918*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa %xmm1, %xmm2 919*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm0, %xmm2 920*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 921*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa %xmm3, %xmm4 922*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pshufb %xmm2, %xmm4 923*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psrlw $4, %xmm1 924*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm0, %xmm1 925*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pshufb %xmm1, %xmm3 926*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: paddb %xmm4, %xmm3 927*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa %xmm3, %xmm0 928*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psllw $8, %xmm0 929*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: paddb %xmm3, %xmm0 930*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psrlw $8, %xmm0 931*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: retq 932*9880d681SAndroid Build Coastguard Worker; 933*9880d681SAndroid Build Coastguard Worker; SSE41-LABEL: testv8i16u: 934*9880d681SAndroid Build Coastguard Worker; SSE41: # BB#0: 935*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pxor %xmm1, %xmm1 936*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psubw %xmm0, %xmm1 937*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm0, %xmm1 938*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psubw {{.*}}(%rip), %xmm1 
939*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa {{.*#+}} xmm0 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 940*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa %xmm1, %xmm2 941*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm0, %xmm2 942*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 943*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa %xmm3, %xmm4 944*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pshufb %xmm2, %xmm4 945*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psrlw $4, %xmm1 946*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm0, %xmm1 947*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pshufb %xmm1, %xmm3 948*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: paddb %xmm4, %xmm3 949*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa %xmm3, %xmm0 950*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psllw $8, %xmm0 951*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: paddb %xmm3, %xmm0 952*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psrlw $8, %xmm0 953*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: retq 954*9880d681SAndroid Build Coastguard Worker; 955*9880d681SAndroid Build Coastguard Worker; AVX1-LABEL: testv8i16u: 956*9880d681SAndroid Build Coastguard Worker; AVX1: # BB#0: 957*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpxor %xmm1, %xmm1, %xmm1 958*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsubw %xmm0, %xmm1, %xmm1 959*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm1, %xmm0, %xmm0 960*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsubw {{.*}}(%rip), %xmm0, %xmm0 961*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 962*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm1, %xmm0, %xmm2 963*9880d681SAndroid Build Coastguard 
Worker; AVX1-NEXT: vmovdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 964*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpshufb %xmm2, %xmm3, %xmm2 965*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsrlw $4, %xmm0, %xmm0 966*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm1, %xmm0, %xmm0 967*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpshufb %xmm0, %xmm3, %xmm0 968*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpaddb %xmm2, %xmm0, %xmm0 969*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsllw $8, %xmm0, %xmm1 970*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpaddb %xmm0, %xmm1, %xmm0 971*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsrlw $8, %xmm0, %xmm0 972*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: retq 973*9880d681SAndroid Build Coastguard Worker; 974*9880d681SAndroid Build Coastguard Worker; AVX2-LABEL: testv8i16u: 975*9880d681SAndroid Build Coastguard Worker; AVX2: # BB#0: 976*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpxor %xmm1, %xmm1, %xmm1 977*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsubw %xmm0, %xmm1, %xmm1 978*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm1, %xmm0, %xmm0 979*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsubw {{.*}}(%rip), %xmm0, %xmm0 980*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 981*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm1, %xmm0, %xmm2 982*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 983*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpshufb %xmm2, %xmm3, %xmm2 984*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsrlw $4, %xmm0, %xmm0 985*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm1, %xmm0, %xmm0 986*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpshufb %xmm0, %xmm3, %xmm0 
987*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpaddb %xmm2, %xmm0, %xmm0 988*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsllw $8, %xmm0, %xmm1 989*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpaddb %xmm0, %xmm1, %xmm0 990*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsrlw $8, %xmm0, %xmm0 991*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: retq 992*9880d681SAndroid Build Coastguard Worker; 993*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-LABEL: testv8i16u: 994*9880d681SAndroid Build Coastguard Worker; AVX512CDVL: # BB#0: 995*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpxord %xmm1, %xmm1, %xmm1 996*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsubw %xmm0, %xmm1, %xmm1 997*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpandq %xmm1, %xmm0, %xmm0 998*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsubw {{.*}}(%rip), %xmm0, %xmm0 999*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa64 {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1000*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpandq %xmm1, %xmm0, %xmm2 1001*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa64 {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1002*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpshufb %xmm2, %xmm3, %xmm2 1003*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsrlw $4, %xmm0, %xmm0 1004*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpandq %xmm1, %xmm0, %xmm0 1005*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpshufb %xmm0, %xmm3, %xmm0 1006*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpaddb %xmm2, %xmm0, %xmm0 1007*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsllw $8, %xmm0, %xmm1 1008*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpaddb %xmm0, %xmm1, %xmm0 1009*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: 
vpsrlw $8, %xmm0, %xmm0 1010*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: retq 1011*9880d681SAndroid Build Coastguard Worker; 1012*9880d681SAndroid Build Coastguard Worker; AVX512CD-LABEL: testv8i16u: 1013*9880d681SAndroid Build Coastguard Worker; AVX512CD: # BB#0: 1014*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpxor %xmm1, %xmm1, %xmm1 1015*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsubw %xmm0, %xmm1, %xmm1 1016*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpand %xmm1, %xmm0, %xmm0 1017*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsubw {{.*}}(%rip), %xmm0, %xmm0 1018*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1019*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpand %xmm1, %xmm0, %xmm2 1020*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1021*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpshufb %xmm2, %xmm3, %xmm2 1022*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsrlw $4, %xmm0, %xmm0 1023*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpand %xmm1, %xmm0, %xmm0 1024*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpshufb %xmm0, %xmm3, %xmm0 1025*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpaddb %xmm2, %xmm0, %xmm0 1026*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsllw $8, %xmm0, %xmm1 1027*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpaddb %xmm0, %xmm1, %xmm0 1028*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsrlw $8, %xmm0, %xmm0 1029*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: retq 1030*9880d681SAndroid Build Coastguard Worker; 1031*9880d681SAndroid Build Coastguard Worker; X32-SSE-LABEL: testv8i16u: 1032*9880d681SAndroid Build Coastguard Worker; X32-SSE: # BB#0: 1033*9880d681SAndroid Build Coastguard Worker; 
X32-SSE-NEXT: pxor %xmm1, %xmm1 1034*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psubw %xmm0, %xmm1 1035*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm0, %xmm1 1036*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psubw {{\.LCPI.*}}, %xmm1 1037*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa {{.*#+}} xmm0 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1038*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa %xmm1, %xmm2 1039*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm0, %xmm2 1040*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1041*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa %xmm3, %xmm4 1042*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pshufb %xmm2, %xmm4 1043*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psrlw $4, %xmm1 1044*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm0, %xmm1 1045*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pshufb %xmm1, %xmm3 1046*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: paddb %xmm4, %xmm3 1047*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa %xmm3, %xmm0 1048*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psllw $8, %xmm0 1049*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: paddb %xmm3, %xmm0 1050*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psrlw $8, %xmm0 1051*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: retl 1052*9880d681SAndroid Build Coastguard Worker %out = call <8 x i16> @llvm.cttz.v8i16(<8 x i16> %in, i1 -1) 1053*9880d681SAndroid Build Coastguard Worker ret <8 x i16> %out 1054*9880d681SAndroid Build Coastguard Worker} 1055*9880d681SAndroid Build Coastguard Worker 1056*9880d681SAndroid Build Coastguard Workerdefine <16 x i8> @testv16i8(<16 x i8> %in) nounwind { 1057*9880d681SAndroid Build Coastguard Worker; SSE2-LABEL: testv16i8: 
1058*9880d681SAndroid Build Coastguard Worker; SSE2: # BB#0: 1059*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pxor %xmm1, %xmm1 1060*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubb %xmm0, %xmm1 1061*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm1 1062*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubb {{.*}}(%rip), %xmm1 1063*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm1, %xmm0 1064*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $1, %xmm0 1065*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand {{.*}}(%rip), %xmm0 1066*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubb %xmm0, %xmm1 1067*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa {{.*#+}} xmm0 = [51,51,51,51,51,51,51,51,51,51,51,51,51,51,51,51] 1068*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm1, %xmm2 1069*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm2 1070*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $2, %xmm1 1071*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm1 1072*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: paddb %xmm2, %xmm1 1073*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm1, %xmm0 1074*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $4, %xmm0 1075*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: paddb %xmm1, %xmm0 1076*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand {{.*}}(%rip), %xmm0 1077*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: retq 1078*9880d681SAndroid Build Coastguard Worker; 1079*9880d681SAndroid Build Coastguard Worker; SSE3-LABEL: testv16i8: 1080*9880d681SAndroid Build Coastguard Worker; SSE3: # BB#0: 1081*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pxor %xmm1, %xmm1 1082*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubb %xmm0, %xmm1 1083*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm1 
1084*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubb {{.*}}(%rip), %xmm1 1085*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm1, %xmm0 1086*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $1, %xmm0 1087*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand {{.*}}(%rip), %xmm0 1088*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubb %xmm0, %xmm1 1089*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa {{.*#+}} xmm0 = [51,51,51,51,51,51,51,51,51,51,51,51,51,51,51,51] 1090*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm1, %xmm2 1091*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm2 1092*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $2, %xmm1 1093*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm1 1094*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: paddb %xmm2, %xmm1 1095*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm1, %xmm0 1096*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $4, %xmm0 1097*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: paddb %xmm1, %xmm0 1098*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand {{.*}}(%rip), %xmm0 1099*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: retq 1100*9880d681SAndroid Build Coastguard Worker; 1101*9880d681SAndroid Build Coastguard Worker; SSSE3-LABEL: testv16i8: 1102*9880d681SAndroid Build Coastguard Worker; SSSE3: # BB#0: 1103*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pxor %xmm1, %xmm1 1104*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psubb %xmm0, %xmm1 1105*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm0, %xmm1 1106*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psubb {{.*}}(%rip), %xmm1 1107*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa {{.*#+}} xmm2 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1108*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa %xmm1, %xmm3 
1109*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm2, %xmm3 1110*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa {{.*#+}} xmm0 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1111*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa %xmm0, %xmm4 1112*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pshufb %xmm3, %xmm4 1113*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psrlw $4, %xmm1 1114*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm2, %xmm1 1115*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pshufb %xmm1, %xmm0 1116*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: paddb %xmm4, %xmm0 1117*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: retq 1118*9880d681SAndroid Build Coastguard Worker; 1119*9880d681SAndroid Build Coastguard Worker; SSE41-LABEL: testv16i8: 1120*9880d681SAndroid Build Coastguard Worker; SSE41: # BB#0: 1121*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pxor %xmm1, %xmm1 1122*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psubb %xmm0, %xmm1 1123*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm0, %xmm1 1124*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psubb {{.*}}(%rip), %xmm1 1125*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa {{.*#+}} xmm2 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1126*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa %xmm1, %xmm3 1127*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm2, %xmm3 1128*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa {{.*#+}} xmm0 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1129*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa %xmm0, %xmm4 1130*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pshufb %xmm3, %xmm4 1131*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psrlw $4, %xmm1 1132*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm2, %xmm1 1133*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: 
pshufb %xmm1, %xmm0 1134*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: paddb %xmm4, %xmm0 1135*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: retq 1136*9880d681SAndroid Build Coastguard Worker; 1137*9880d681SAndroid Build Coastguard Worker; AVX1-LABEL: testv16i8: 1138*9880d681SAndroid Build Coastguard Worker; AVX1: # BB#0: 1139*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpxor %xmm1, %xmm1, %xmm1 1140*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsubb %xmm0, %xmm1, %xmm1 1141*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm1, %xmm0, %xmm0 1142*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsubb {{.*}}(%rip), %xmm0, %xmm0 1143*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1144*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm1, %xmm0, %xmm2 1145*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1146*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpshufb %xmm2, %xmm3, %xmm2 1147*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsrlw $4, %xmm0, %xmm0 1148*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm1, %xmm0, %xmm0 1149*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpshufb %xmm0, %xmm3, %xmm0 1150*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpaddb %xmm2, %xmm0, %xmm0 1151*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: retq 1152*9880d681SAndroid Build Coastguard Worker; 1153*9880d681SAndroid Build Coastguard Worker; AVX2-LABEL: testv16i8: 1154*9880d681SAndroid Build Coastguard Worker; AVX2: # BB#0: 1155*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpxor %xmm1, %xmm1, %xmm1 1156*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsubb %xmm0, %xmm1, %xmm1 1157*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm1, %xmm0, %xmm0 1158*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsubb 
{{.*}}(%rip), %xmm0, %xmm0 1159*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1160*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm1, %xmm0, %xmm2 1161*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1162*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpshufb %xmm2, %xmm3, %xmm2 1163*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsrlw $4, %xmm0, %xmm0 1164*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm1, %xmm0, %xmm0 1165*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpshufb %xmm0, %xmm3, %xmm0 1166*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpaddb %xmm2, %xmm0, %xmm0 1167*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: retq 1168*9880d681SAndroid Build Coastguard Worker; 1169*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-LABEL: testv16i8: 1170*9880d681SAndroid Build Coastguard Worker; AVX512CDVL: # BB#0: 1171*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpxord %xmm1, %xmm1, %xmm1 1172*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsubb %xmm0, %xmm1, %xmm1 1173*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpandq %xmm1, %xmm0, %xmm0 1174*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsubb {{.*}}(%rip), %xmm0, %xmm0 1175*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa64 {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1176*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpandq %xmm1, %xmm0, %xmm2 1177*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa64 {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1178*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpshufb %xmm2, %xmm3, %xmm2 1179*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsrlw $4, %xmm0, %xmm0 1180*9880d681SAndroid Build Coastguard Worker; 
AVX512CDVL-NEXT: vpandq %xmm1, %xmm0, %xmm0 1181*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpshufb %xmm0, %xmm3, %xmm0 1182*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpaddb %xmm2, %xmm0, %xmm0 1183*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: retq 1184*9880d681SAndroid Build Coastguard Worker; 1185*9880d681SAndroid Build Coastguard Worker; AVX512CD-LABEL: testv16i8: 1186*9880d681SAndroid Build Coastguard Worker; AVX512CD: # BB#0: 1187*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpxor %xmm1, %xmm1, %xmm1 1188*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsubb %xmm0, %xmm1, %xmm1 1189*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpand %xmm1, %xmm0, %xmm0 1190*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsubb {{.*}}(%rip), %xmm0, %xmm0 1191*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1192*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpand %xmm1, %xmm0, %xmm2 1193*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1194*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpshufb %xmm2, %xmm3, %xmm2 1195*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsrlw $4, %xmm0, %xmm0 1196*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpand %xmm1, %xmm0, %xmm0 1197*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpshufb %xmm0, %xmm3, %xmm0 1198*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpaddb %xmm2, %xmm0, %xmm0 1199*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: retq 1200*9880d681SAndroid Build Coastguard Worker; 1201*9880d681SAndroid Build Coastguard Worker; X32-SSE-LABEL: testv16i8: 1202*9880d681SAndroid Build Coastguard Worker; X32-SSE: # BB#0: 1203*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pxor %xmm1, %xmm1 1204*9880d681SAndroid Build Coastguard 
Worker; X32-SSE-NEXT: psubb %xmm0, %xmm1 1205*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm0, %xmm1 1206*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psubb {{\.LCPI.*}}, %xmm1 1207*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa {{.*#+}} xmm2 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1208*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa %xmm1, %xmm3 1209*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm2, %xmm3 1210*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa {{.*#+}} xmm0 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1211*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa %xmm0, %xmm4 1212*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pshufb %xmm3, %xmm4 1213*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psrlw $4, %xmm1 1214*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm2, %xmm1 1215*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pshufb %xmm1, %xmm0 1216*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: paddb %xmm4, %xmm0 1217*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: retl 1218*9880d681SAndroid Build Coastguard Worker %out = call <16 x i8> @llvm.cttz.v16i8(<16 x i8> %in, i1 0) 1219*9880d681SAndroid Build Coastguard Worker ret <16 x i8> %out 1220*9880d681SAndroid Build Coastguard Worker} 1221*9880d681SAndroid Build Coastguard Worker 1222*9880d681SAndroid Build Coastguard Workerdefine <16 x i8> @testv16i8u(<16 x i8> %in) nounwind { 1223*9880d681SAndroid Build Coastguard Worker; SSE2-LABEL: testv16i8u: 1224*9880d681SAndroid Build Coastguard Worker; SSE2: # BB#0: 1225*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pxor %xmm1, %xmm1 1226*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubb %xmm0, %xmm1 1227*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm1 1228*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubb {{.*}}(%rip), %xmm1 1229*9880d681SAndroid 
Build Coastguard Worker; SSE2-NEXT: movdqa %xmm1, %xmm0 1230*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $1, %xmm0 1231*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand {{.*}}(%rip), %xmm0 1232*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psubb %xmm0, %xmm1 1233*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa {{.*#+}} xmm0 = [51,51,51,51,51,51,51,51,51,51,51,51,51,51,51,51] 1234*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm1, %xmm2 1235*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm2 1236*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $2, %xmm1 1237*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand %xmm0, %xmm1 1238*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: paddb %xmm2, %xmm1 1239*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: movdqa %xmm1, %xmm0 1240*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: psrlw $4, %xmm0 1241*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: paddb %xmm1, %xmm0 1242*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: pand {{.*}}(%rip), %xmm0 1243*9880d681SAndroid Build Coastguard Worker; SSE2-NEXT: retq 1244*9880d681SAndroid Build Coastguard Worker; 1245*9880d681SAndroid Build Coastguard Worker; SSE3-LABEL: testv16i8u: 1246*9880d681SAndroid Build Coastguard Worker; SSE3: # BB#0: 1247*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pxor %xmm1, %xmm1 1248*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubb %xmm0, %xmm1 1249*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm1 1250*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubb {{.*}}(%rip), %xmm1 1251*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm1, %xmm0 1252*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $1, %xmm0 1253*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand {{.*}}(%rip), %xmm0 1254*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psubb %xmm0, %xmm1 
1255*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa {{.*#+}} xmm0 = [51,51,51,51,51,51,51,51,51,51,51,51,51,51,51,51] 1256*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm1, %xmm2 1257*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm2 1258*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $2, %xmm1 1259*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand %xmm0, %xmm1 1260*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: paddb %xmm2, %xmm1 1261*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: movdqa %xmm1, %xmm0 1262*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: psrlw $4, %xmm0 1263*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: paddb %xmm1, %xmm0 1264*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: pand {{.*}}(%rip), %xmm0 1265*9880d681SAndroid Build Coastguard Worker; SSE3-NEXT: retq 1266*9880d681SAndroid Build Coastguard Worker; 1267*9880d681SAndroid Build Coastguard Worker; SSSE3-LABEL: testv16i8u: 1268*9880d681SAndroid Build Coastguard Worker; SSSE3: # BB#0: 1269*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pxor %xmm1, %xmm1 1270*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psubb %xmm0, %xmm1 1271*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm0, %xmm1 1272*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: psubb {{.*}}(%rip), %xmm1 1273*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa {{.*#+}} xmm2 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1274*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa %xmm1, %xmm3 1275*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm2, %xmm3 1276*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa {{.*#+}} xmm0 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1277*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: movdqa %xmm0, %xmm4 1278*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pshufb %xmm3, %xmm4 1279*9880d681SAndroid Build Coastguard Worker; 
SSSE3-NEXT: psrlw $4, %xmm1 1280*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pand %xmm2, %xmm1 1281*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: pshufb %xmm1, %xmm0 1282*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: paddb %xmm4, %xmm0 1283*9880d681SAndroid Build Coastguard Worker; SSSE3-NEXT: retq 1284*9880d681SAndroid Build Coastguard Worker; 1285*9880d681SAndroid Build Coastguard Worker; SSE41-LABEL: testv16i8u: 1286*9880d681SAndroid Build Coastguard Worker; SSE41: # BB#0: 1287*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pxor %xmm1, %xmm1 1288*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psubb %xmm0, %xmm1 1289*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm0, %xmm1 1290*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psubb {{.*}}(%rip), %xmm1 1291*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa {{.*#+}} xmm2 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1292*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa %xmm1, %xmm3 1293*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm2, %xmm3 1294*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa {{.*#+}} xmm0 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1295*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: movdqa %xmm0, %xmm4 1296*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pshufb %xmm3, %xmm4 1297*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: psrlw $4, %xmm1 1298*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pand %xmm2, %xmm1 1299*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: pshufb %xmm1, %xmm0 1300*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: paddb %xmm4, %xmm0 1301*9880d681SAndroid Build Coastguard Worker; SSE41-NEXT: retq 1302*9880d681SAndroid Build Coastguard Worker; 1303*9880d681SAndroid Build Coastguard Worker; AVX1-LABEL: testv16i8u: 1304*9880d681SAndroid Build Coastguard Worker; AVX1: # BB#0: 1305*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: 
vpxor %xmm1, %xmm1, %xmm1 1306*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsubb %xmm0, %xmm1, %xmm1 1307*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm1, %xmm0, %xmm0 1308*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsubb {{.*}}(%rip), %xmm0, %xmm0 1309*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1310*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm1, %xmm0, %xmm2 1311*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1312*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpshufb %xmm2, %xmm3, %xmm2 1313*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpsrlw $4, %xmm0, %xmm0 1314*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpand %xmm1, %xmm0, %xmm0 1315*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpshufb %xmm0, %xmm3, %xmm0 1316*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vpaddb %xmm2, %xmm0, %xmm0 1317*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: retq 1318*9880d681SAndroid Build Coastguard Worker; 1319*9880d681SAndroid Build Coastguard Worker; AVX2-LABEL: testv16i8u: 1320*9880d681SAndroid Build Coastguard Worker; AVX2: # BB#0: 1321*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpxor %xmm1, %xmm1, %xmm1 1322*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsubb %xmm0, %xmm1, %xmm1 1323*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm1, %xmm0, %xmm0 1324*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsubb {{.*}}(%rip), %xmm0, %xmm0 1325*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1326*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm1, %xmm0, %xmm2 1327*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1328*9880d681SAndroid Build Coastguard 
Worker; AVX2-NEXT: vpshufb %xmm2, %xmm3, %xmm2 1329*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpsrlw $4, %xmm0, %xmm0 1330*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpand %xmm1, %xmm0, %xmm0 1331*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpshufb %xmm0, %xmm3, %xmm0 1332*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vpaddb %xmm2, %xmm0, %xmm0 1333*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: retq 1334*9880d681SAndroid Build Coastguard Worker; 1335*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-LABEL: testv16i8u: 1336*9880d681SAndroid Build Coastguard Worker; AVX512CDVL: # BB#0: 1337*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpxord %xmm1, %xmm1, %xmm1 1338*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsubb %xmm0, %xmm1, %xmm1 1339*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpandq %xmm1, %xmm0, %xmm0 1340*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsubb {{.*}}(%rip), %xmm0, %xmm0 1341*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa64 {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1342*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpandq %xmm1, %xmm0, %xmm2 1343*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa64 {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1344*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpshufb %xmm2, %xmm3, %xmm2 1345*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpsrlw $4, %xmm0, %xmm0 1346*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpandq %xmm1, %xmm0, %xmm0 1347*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpshufb %xmm0, %xmm3, %xmm0 1348*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vpaddb %xmm2, %xmm0, %xmm0 1349*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: retq 1350*9880d681SAndroid Build Coastguard Worker; 1351*9880d681SAndroid Build Coastguard Worker; AVX512CD-LABEL: 
testv16i8u: 1352*9880d681SAndroid Build Coastguard Worker; AVX512CD: # BB#0: 1353*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpxor %xmm1, %xmm1, %xmm1 1354*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsubb %xmm0, %xmm1, %xmm1 1355*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpand %xmm1, %xmm0, %xmm0 1356*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsubb {{.*}}(%rip), %xmm0, %xmm0 1357*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1358*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpand %xmm1, %xmm0, %xmm2 1359*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1360*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpshufb %xmm2, %xmm3, %xmm2 1361*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpsrlw $4, %xmm0, %xmm0 1362*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpand %xmm1, %xmm0, %xmm0 1363*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpshufb %xmm0, %xmm3, %xmm0 1364*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vpaddb %xmm2, %xmm0, %xmm0 1365*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: retq 1366*9880d681SAndroid Build Coastguard Worker; 1367*9880d681SAndroid Build Coastguard Worker; X32-SSE-LABEL: testv16i8u: 1368*9880d681SAndroid Build Coastguard Worker; X32-SSE: # BB#0: 1369*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pxor %xmm1, %xmm1 1370*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psubb %xmm0, %xmm1 1371*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm0, %xmm1 1372*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psubb {{\.LCPI.*}}, %xmm1 1373*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa {{.*#+}} xmm2 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 1374*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: 
movdqa %xmm1, %xmm3 1375*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm2, %xmm3 1376*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa {{.*#+}} xmm0 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4] 1377*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movdqa %xmm0, %xmm4 1378*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pshufb %xmm3, %xmm4 1379*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: psrlw $4, %xmm1 1380*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pand %xmm2, %xmm1 1381*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: pshufb %xmm1, %xmm0 1382*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: paddb %xmm4, %xmm0 1383*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: retl 1384*9880d681SAndroid Build Coastguard Worker %out = call <16 x i8> @llvm.cttz.v16i8(<16 x i8> %in, i1 -1) 1385*9880d681SAndroid Build Coastguard Worker ret <16 x i8> %out 1386*9880d681SAndroid Build Coastguard Worker} 1387*9880d681SAndroid Build Coastguard Worker 1388*9880d681SAndroid Build Coastguard Workerdefine <2 x i64> @foldv2i64() nounwind { 1389*9880d681SAndroid Build Coastguard Worker; SSE-LABEL: foldv2i64: 1390*9880d681SAndroid Build Coastguard Worker; SSE: # BB#0: 1391*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: movl $8, %eax 1392*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: movd %rax, %xmm0 1393*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: retq 1394*9880d681SAndroid Build Coastguard Worker; 1395*9880d681SAndroid Build Coastguard Worker; AVX-LABEL: foldv2i64: 1396*9880d681SAndroid Build Coastguard Worker; AVX: # BB#0: 1397*9880d681SAndroid Build Coastguard Worker; AVX-NEXT: movl $8, %eax 1398*9880d681SAndroid Build Coastguard Worker; AVX-NEXT: vmovq %rax, %xmm0 1399*9880d681SAndroid Build Coastguard Worker; AVX-NEXT: retq 1400*9880d681SAndroid Build Coastguard Worker; 1401*9880d681SAndroid Build Coastguard Worker; X32-SSE-LABEL: foldv2i64: 1402*9880d681SAndroid Build Coastguard Worker; 
X32-SSE: # BB#0: 1403*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movl $8, %eax 1404*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movd %eax, %xmm0 1405*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: retl 1406*9880d681SAndroid Build Coastguard Worker %out = call <2 x i64> @llvm.cttz.v2i64(<2 x i64> <i64 256, i64 -1>, i1 0) 1407*9880d681SAndroid Build Coastguard Worker ret <2 x i64> %out 1408*9880d681SAndroid Build Coastguard Worker} 1409*9880d681SAndroid Build Coastguard Worker 1410*9880d681SAndroid Build Coastguard Workerdefine <2 x i64> @foldv2i64u() nounwind { 1411*9880d681SAndroid Build Coastguard Worker; SSE-LABEL: foldv2i64u: 1412*9880d681SAndroid Build Coastguard Worker; SSE: # BB#0: 1413*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: movl $8, %eax 1414*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: movd %rax, %xmm0 1415*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: retq 1416*9880d681SAndroid Build Coastguard Worker; 1417*9880d681SAndroid Build Coastguard Worker; AVX-LABEL: foldv2i64u: 1418*9880d681SAndroid Build Coastguard Worker; AVX: # BB#0: 1419*9880d681SAndroid Build Coastguard Worker; AVX-NEXT: movl $8, %eax 1420*9880d681SAndroid Build Coastguard Worker; AVX-NEXT: vmovq %rax, %xmm0 1421*9880d681SAndroid Build Coastguard Worker; AVX-NEXT: retq 1422*9880d681SAndroid Build Coastguard Worker; 1423*9880d681SAndroid Build Coastguard Worker; X32-SSE-LABEL: foldv2i64u: 1424*9880d681SAndroid Build Coastguard Worker; X32-SSE: # BB#0: 1425*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movl $8, %eax 1426*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movd %eax, %xmm0 1427*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: retl 1428*9880d681SAndroid Build Coastguard Worker %out = call <2 x i64> @llvm.cttz.v2i64(<2 x i64> <i64 256, i64 -1>, i1 -1) 1429*9880d681SAndroid Build Coastguard Worker ret <2 x i64> %out 1430*9880d681SAndroid Build Coastguard Worker} 1431*9880d681SAndroid Build Coastguard 
Worker 1432*9880d681SAndroid Build Coastguard Workerdefine <4 x i32> @foldv4i32() nounwind { 1433*9880d681SAndroid Build Coastguard Worker; SSE-LABEL: foldv4i32: 1434*9880d681SAndroid Build Coastguard Worker; SSE: # BB#0: 1435*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: movaps {{.*#+}} xmm0 = [8,0,32,0] 1436*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: retq 1437*9880d681SAndroid Build Coastguard Worker; 1438*9880d681SAndroid Build Coastguard Worker; AVX1-LABEL: foldv4i32: 1439*9880d681SAndroid Build Coastguard Worker; AVX1: # BB#0: 1440*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,32,0] 1441*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: retq 1442*9880d681SAndroid Build Coastguard Worker; 1443*9880d681SAndroid Build Coastguard Worker; AVX2-LABEL: foldv4i32: 1444*9880d681SAndroid Build Coastguard Worker; AVX2: # BB#0: 1445*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,32,0] 1446*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: retq 1447*9880d681SAndroid Build Coastguard Worker; 1448*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-LABEL: foldv4i32: 1449*9880d681SAndroid Build Coastguard Worker; AVX512CDVL: # BB#0: 1450*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa32 {{.*#+}} xmm0 = [8,0,32,0] 1451*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: retq 1452*9880d681SAndroid Build Coastguard Worker; 1453*9880d681SAndroid Build Coastguard Worker; AVX512CD-LABEL: foldv4i32: 1454*9880d681SAndroid Build Coastguard Worker; AVX512CD: # BB#0: 1455*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,32,0] 1456*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: retq 1457*9880d681SAndroid Build Coastguard Worker; 1458*9880d681SAndroid Build Coastguard Worker; X32-SSE-LABEL: foldv4i32: 1459*9880d681SAndroid Build Coastguard Worker; X32-SSE: # BB#0: 1460*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: 
movaps {{.*#+}} xmm0 = [8,0,32,0] 1461*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: retl 1462*9880d681SAndroid Build Coastguard Worker %out = call <4 x i32> @llvm.cttz.v4i32(<4 x i32> <i32 256, i32 -1, i32 0, i32 255>, i1 0) 1463*9880d681SAndroid Build Coastguard Worker ret <4 x i32> %out 1464*9880d681SAndroid Build Coastguard Worker} 1465*9880d681SAndroid Build Coastguard Worker 1466*9880d681SAndroid Build Coastguard Workerdefine <4 x i32> @foldv4i32u() nounwind { 1467*9880d681SAndroid Build Coastguard Worker; SSE-LABEL: foldv4i32u: 1468*9880d681SAndroid Build Coastguard Worker; SSE: # BB#0: 1469*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: movaps {{.*#+}} xmm0 = [8,0,32,0] 1470*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: retq 1471*9880d681SAndroid Build Coastguard Worker; 1472*9880d681SAndroid Build Coastguard Worker; AVX1-LABEL: foldv4i32u: 1473*9880d681SAndroid Build Coastguard Worker; AVX1: # BB#0: 1474*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,32,0] 1475*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: retq 1476*9880d681SAndroid Build Coastguard Worker; 1477*9880d681SAndroid Build Coastguard Worker; AVX2-LABEL: foldv4i32u: 1478*9880d681SAndroid Build Coastguard Worker; AVX2: # BB#0: 1479*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,32,0] 1480*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: retq 1481*9880d681SAndroid Build Coastguard Worker; 1482*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-LABEL: foldv4i32u: 1483*9880d681SAndroid Build Coastguard Worker; AVX512CDVL: # BB#0: 1484*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa32 {{.*#+}} xmm0 = [8,0,32,0] 1485*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: retq 1486*9880d681SAndroid Build Coastguard Worker; 1487*9880d681SAndroid Build Coastguard Worker; AVX512CD-LABEL: foldv4i32u: 1488*9880d681SAndroid Build Coastguard Worker; AVX512CD: # BB#0: 
1489*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,32,0] 1490*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: retq 1491*9880d681SAndroid Build Coastguard Worker; 1492*9880d681SAndroid Build Coastguard Worker; X32-SSE-LABEL: foldv4i32u: 1493*9880d681SAndroid Build Coastguard Worker; X32-SSE: # BB#0: 1494*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movaps {{.*#+}} xmm0 = [8,0,32,0] 1495*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: retl 1496*9880d681SAndroid Build Coastguard Worker %out = call <4 x i32> @llvm.cttz.v4i32(<4 x i32> <i32 256, i32 -1, i32 0, i32 255>, i1 -1) 1497*9880d681SAndroid Build Coastguard Worker ret <4 x i32> %out 1498*9880d681SAndroid Build Coastguard Worker} 1499*9880d681SAndroid Build Coastguard Worker 1500*9880d681SAndroid Build Coastguard Workerdefine <8 x i16> @foldv8i16() nounwind { 1501*9880d681SAndroid Build Coastguard Worker; SSE-LABEL: foldv8i16: 1502*9880d681SAndroid Build Coastguard Worker; SSE: # BB#0: 1503*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: movaps {{.*#+}} xmm0 = [8,0,16,0,16,0,3,3] 1504*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: retq 1505*9880d681SAndroid Build Coastguard Worker; 1506*9880d681SAndroid Build Coastguard Worker; AVX1-LABEL: foldv8i16: 1507*9880d681SAndroid Build Coastguard Worker; AVX1: # BB#0: 1508*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,16,0,16,0,3,3] 1509*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: retq 1510*9880d681SAndroid Build Coastguard Worker; 1511*9880d681SAndroid Build Coastguard Worker; AVX2-LABEL: foldv8i16: 1512*9880d681SAndroid Build Coastguard Worker; AVX2: # BB#0: 1513*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,16,0,16,0,3,3] 1514*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: retq 1515*9880d681SAndroid Build Coastguard Worker; 1516*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-LABEL: foldv8i16: 
1517*9880d681SAndroid Build Coastguard Worker; AVX512CDVL: # BB#0: 1518*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa64 {{.*#+}} xmm0 = [8,0,16,0,16,0,3,3] 1519*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: retq 1520*9880d681SAndroid Build Coastguard Worker; 1521*9880d681SAndroid Build Coastguard Worker; AVX512CD-LABEL: foldv8i16: 1522*9880d681SAndroid Build Coastguard Worker; AVX512CD: # BB#0: 1523*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,16,0,16,0,3,3] 1524*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: retq 1525*9880d681SAndroid Build Coastguard Worker; 1526*9880d681SAndroid Build Coastguard Worker; X32-SSE-LABEL: foldv8i16: 1527*9880d681SAndroid Build Coastguard Worker; X32-SSE: # BB#0: 1528*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movaps {{.*#+}} xmm0 = [8,0,16,0,16,0,3,3] 1529*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: retl 1530*9880d681SAndroid Build Coastguard Worker %out = call <8 x i16> @llvm.cttz.v8i16(<8 x i16> <i16 256, i16 -1, i16 0, i16 255, i16 -65536, i16 7, i16 24, i16 88>, i1 0) 1531*9880d681SAndroid Build Coastguard Worker ret <8 x i16> %out 1532*9880d681SAndroid Build Coastguard Worker} 1533*9880d681SAndroid Build Coastguard Worker 1534*9880d681SAndroid Build Coastguard Workerdefine <8 x i16> @foldv8i16u() nounwind { 1535*9880d681SAndroid Build Coastguard Worker; SSE-LABEL: foldv8i16u: 1536*9880d681SAndroid Build Coastguard Worker; SSE: # BB#0: 1537*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: movaps {{.*#+}} xmm0 = [8,0,16,0,16,0,3,3] 1538*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: retq 1539*9880d681SAndroid Build Coastguard Worker; 1540*9880d681SAndroid Build Coastguard Worker; AVX1-LABEL: foldv8i16u: 1541*9880d681SAndroid Build Coastguard Worker; AVX1: # BB#0: 1542*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,16,0,16,0,3,3] 1543*9880d681SAndroid Build Coastguard Worker; 
AVX1-NEXT: retq 1544*9880d681SAndroid Build Coastguard Worker; 1545*9880d681SAndroid Build Coastguard Worker; AVX2-LABEL: foldv8i16u: 1546*9880d681SAndroid Build Coastguard Worker; AVX2: # BB#0: 1547*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,16,0,16,0,3,3] 1548*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: retq 1549*9880d681SAndroid Build Coastguard Worker; 1550*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-LABEL: foldv8i16u: 1551*9880d681SAndroid Build Coastguard Worker; AVX512CDVL: # BB#0: 1552*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa64 {{.*#+}} xmm0 = [8,0,16,0,16,0,3,3] 1553*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: retq 1554*9880d681SAndroid Build Coastguard Worker; 1555*9880d681SAndroid Build Coastguard Worker; AVX512CD-LABEL: foldv8i16u: 1556*9880d681SAndroid Build Coastguard Worker; AVX512CD: # BB#0: 1557*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,16,0,16,0,3,3] 1558*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: retq 1559*9880d681SAndroid Build Coastguard Worker; 1560*9880d681SAndroid Build Coastguard Worker; X32-SSE-LABEL: foldv8i16u: 1561*9880d681SAndroid Build Coastguard Worker; X32-SSE: # BB#0: 1562*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movaps {{.*#+}} xmm0 = [8,0,16,0,16,0,3,3] 1563*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: retl 1564*9880d681SAndroid Build Coastguard Worker %out = call <8 x i16> @llvm.cttz.v8i16(<8 x i16> <i16 256, i16 -1, i16 0, i16 255, i16 -65536, i16 7, i16 24, i16 88>, i1 -1) 1565*9880d681SAndroid Build Coastguard Worker ret <8 x i16> %out 1566*9880d681SAndroid Build Coastguard Worker} 1567*9880d681SAndroid Build Coastguard Worker 1568*9880d681SAndroid Build Coastguard Workerdefine <16 x i8> @foldv16i8() nounwind { 1569*9880d681SAndroid Build Coastguard Worker; SSE-LABEL: foldv16i8: 1570*9880d681SAndroid Build Coastguard Worker; SSE: # BB#0: 
1571*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: movaps {{.*#+}} xmm0 = [8,0,8,0,8,0,3,3,1,1,0,1,2,3,4,5] 1572*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: retq 1573*9880d681SAndroid Build Coastguard Worker; 1574*9880d681SAndroid Build Coastguard Worker; AVX1-LABEL: foldv16i8: 1575*9880d681SAndroid Build Coastguard Worker; AVX1: # BB#0: 1576*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,8,0,8,0,3,3,1,1,0,1,2,3,4,5] 1577*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: retq 1578*9880d681SAndroid Build Coastguard Worker; 1579*9880d681SAndroid Build Coastguard Worker; AVX2-LABEL: foldv16i8: 1580*9880d681SAndroid Build Coastguard Worker; AVX2: # BB#0: 1581*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,8,0,8,0,3,3,1,1,0,1,2,3,4,5] 1582*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: retq 1583*9880d681SAndroid Build Coastguard Worker; 1584*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-LABEL: foldv16i8: 1585*9880d681SAndroid Build Coastguard Worker; AVX512CDVL: # BB#0: 1586*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa64 {{.*#+}} xmm0 = [8,0,8,0,8,0,3,3,1,1,0,1,2,3,4,5] 1587*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: retq 1588*9880d681SAndroid Build Coastguard Worker; 1589*9880d681SAndroid Build Coastguard Worker; AVX512CD-LABEL: foldv16i8: 1590*9880d681SAndroid Build Coastguard Worker; AVX512CD: # BB#0: 1591*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,8,0,8,0,3,3,1,1,0,1,2,3,4,5] 1592*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: retq 1593*9880d681SAndroid Build Coastguard Worker; 1594*9880d681SAndroid Build Coastguard Worker; X32-SSE-LABEL: foldv16i8: 1595*9880d681SAndroid Build Coastguard Worker; X32-SSE: # BB#0: 1596*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movaps {{.*#+}} xmm0 = [8,0,8,0,8,0,3,3,1,1,0,1,2,3,4,5] 1597*9880d681SAndroid Build Coastguard Worker; 
X32-SSE-NEXT: retl 1598*9880d681SAndroid Build Coastguard Worker %out = call <16 x i8> @llvm.cttz.v16i8(<16 x i8> <i8 256, i8 -1, i8 0, i8 255, i8 -65536, i8 7, i8 24, i8 88, i8 -2, i8 254, i8 1, i8 2, i8 4, i8 8, i8 16, i8 32>, i1 0) 1599*9880d681SAndroid Build Coastguard Worker ret <16 x i8> %out 1600*9880d681SAndroid Build Coastguard Worker} 1601*9880d681SAndroid Build Coastguard Worker 1602*9880d681SAndroid Build Coastguard Workerdefine <16 x i8> @foldv16i8u() nounwind { 1603*9880d681SAndroid Build Coastguard Worker; SSE-LABEL: foldv16i8u: 1604*9880d681SAndroid Build Coastguard Worker; SSE: # BB#0: 1605*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: movaps {{.*#+}} xmm0 = [8,0,8,0,8,0,3,3,1,1,0,1,2,3,4,5] 1606*9880d681SAndroid Build Coastguard Worker; SSE-NEXT: retq 1607*9880d681SAndroid Build Coastguard Worker; 1608*9880d681SAndroid Build Coastguard Worker; AVX1-LABEL: foldv16i8u: 1609*9880d681SAndroid Build Coastguard Worker; AVX1: # BB#0: 1610*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,8,0,8,0,3,3,1,1,0,1,2,3,4,5] 1611*9880d681SAndroid Build Coastguard Worker; AVX1-NEXT: retq 1612*9880d681SAndroid Build Coastguard Worker; 1613*9880d681SAndroid Build Coastguard Worker; AVX2-LABEL: foldv16i8u: 1614*9880d681SAndroid Build Coastguard Worker; AVX2: # BB#0: 1615*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,8,0,8,0,3,3,1,1,0,1,2,3,4,5] 1616*9880d681SAndroid Build Coastguard Worker; AVX2-NEXT: retq 1617*9880d681SAndroid Build Coastguard Worker; 1618*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-LABEL: foldv16i8u: 1619*9880d681SAndroid Build Coastguard Worker; AVX512CDVL: # BB#0: 1620*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: vmovdqa64 {{.*#+}} xmm0 = [8,0,8,0,8,0,3,3,1,1,0,1,2,3,4,5] 1621*9880d681SAndroid Build Coastguard Worker; AVX512CDVL-NEXT: retq 1622*9880d681SAndroid Build Coastguard Worker; 1623*9880d681SAndroid Build Coastguard Worker; AVX512CD-LABEL: 
foldv16i8u: 1624*9880d681SAndroid Build Coastguard Worker; AVX512CD: # BB#0: 1625*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: vmovaps {{.*#+}} xmm0 = [8,0,8,0,8,0,3,3,1,1,0,1,2,3,4,5] 1626*9880d681SAndroid Build Coastguard Worker; AVX512CD-NEXT: retq 1627*9880d681SAndroid Build Coastguard Worker; 1628*9880d681SAndroid Build Coastguard Worker; X32-SSE-LABEL: foldv16i8u: 1629*9880d681SAndroid Build Coastguard Worker; X32-SSE: # BB#0: 1630*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: movaps {{.*#+}} xmm0 = [8,0,8,0,8,0,3,3,1,1,0,1,2,3,4,5] 1631*9880d681SAndroid Build Coastguard Worker; X32-SSE-NEXT: retl 1632*9880d681SAndroid Build Coastguard Worker %out = call <16 x i8> @llvm.cttz.v16i8(<16 x i8> <i8 256, i8 -1, i8 0, i8 255, i8 -65536, i8 7, i8 24, i8 88, i8 -2, i8 254, i8 1, i8 2, i8 4, i8 8, i8 16, i8 32>, i1 -1) 1633*9880d681SAndroid Build Coastguard Worker ret <16 x i8> %out 1634*9880d681SAndroid Build Coastguard Worker} 1635*9880d681SAndroid Build Coastguard Worker 1636*9880d681SAndroid Build Coastguard Workerdeclare <2 x i64> @llvm.cttz.v2i64(<2 x i64>, i1) 1637*9880d681SAndroid Build Coastguard Workerdeclare <4 x i32> @llvm.cttz.v4i32(<4 x i32>, i1) 1638*9880d681SAndroid Build Coastguard Workerdeclare <8 x i16> @llvm.cttz.v8i16(<8 x i16>, i1) 1639*9880d681SAndroid Build Coastguard Workerdeclare <16 x i8> @llvm.cttz.v16i8(<16 x i8>, i1) 1640