; RUN: llc < %s -march=x86-64 -mattr=+sse4.1 | FileCheck %s

; Each function below loads a short vector through %A, performs a vector add,
; and stores the result back through the same pointer. The FileCheck
; directives ahead of each function list the instructions expected, in order,
; in the assembly produced for that function.

;CHECK-LABEL: load_2_i8:
; A single 16-bit load
;CHECK: pmovzxbq
;CHECK: paddq
;CHECK: pshufb
; A single 16-bit store
;CHECK: movw
;CHECK: ret

define void @load_2_i8(<2 x i8>* %A) {
  %T = load <2 x i8>, <2 x i8>* %A
  %G = add <2 x i8> %T, <i8 9, i8 7>
  store <2 x i8> %G, <2 x i8>* %A
  ret void
}

;CHECK-LABEL: load_2_i16:
; Read 32 bits
;CHECK: pmovzxwq
;CHECK: paddq
;CHECK: pshufd
;CHECK: movd
;CHECK: ret
define void @load_2_i16(<2 x i16>* %A) {
  %T = load <2 x i16>, <2 x i16>* %A
  %G = add <2 x i16> %T, <i16 9, i16 7>
  store <2 x i16> %G, <2 x i16>* %A
  ret void
}

;CHECK-LABEL: load_2_i32:
;CHECK: pmovzxdq
;CHECK: paddd
;CHECK: pshufd
;CHECK: ret
define void @load_2_i32(<2 x i32>* %A) {
  %T = load <2 x i32>, <2 x i32>* %A
  %G = add <2 x i32> %T, <i32 9, i32 7>
  store <2 x i32> %G, <2 x i32>* %A
  ret void
}

;CHECK-LABEL: load_4_i8:
;CHECK: pmovzxbd
;CHECK: paddd
;CHECK: pshufb
;CHECK: ret
define void @load_4_i8(<4 x i8>* %A) {
  %T = load <4 x i8>, <4 x i8>* %A
  %G = add <4 x i8> %T, <i8 1, i8 4, i8 9, i8 7>
  store <4 x i8> %G, <4 x i8>* %A
  ret void
}

;CHECK-LABEL: load_4_i16:
;CHECK: pmovzxwd
;CHECK: paddw
;CHECK: pshufb
;CHECK: ret
define void @load_4_i16(<4 x i16>* %A) {
  %T = load <4 x i16>, <4 x i16>* %A
  %G = add <4 x i16> %T, <i16 1, i16 4, i16 9, i16 7>
  store <4 x i16> %G, <4 x i16>* %A
  ret void
}

; Unlike the functions above, this one adds the loaded vector to itself
; rather than to a constant vector.
;CHECK-LABEL: load_8_i8:
;CHECK: pmovzxbw
;CHECK: paddb
;CHECK: pshufb
;CHECK: ret
define void @load_8_i8(<8 x i8>* %A) {
  %T = load <8 x i8>, <8 x i8>* %A
  %G = add <8 x i8> %T, %T
  store <8 x i8> %G, <8 x i8>* %A
  ret void
}